In [4]:
import os
import ast
import json
import ineqpy
import numpy as np
import pandas as pd
import plotly.io as pio
import plotly.express as px
import plotly.graph_objects as go

from pathlib import Path
from collections import defaultdict

In [5]:
# Project directories, expressed relative to the notebook's working directory.
path_meta = Path("../meta")
path_data = Path("../data")
path_key = Path("../key")
# NOTE(review): presumably the font size applied to the plotly figures — confirm against the plotting cells.
font_size = 15

# Category labels. Workflow patterns are identified by numeric strings, not ints.
# NOTE(review): presumably these are compared against string-typed columns of the leaderboard data — confirm.
workflow_pwc = ['1']
display_format_pwc = ['Rankable Table', 'Scatter Plot']
display_format_rankable = ['Rankable Table', 'Rankable Bar Chart']
workflow_patterns_with_submission = ['1', '2', '3', '4', '5']
non_accepted_publication_type = ['blog', 'report', 'white paper']

# Leaderboard systems, listed by name, that are singled out for lacking a given artifact
# (as stated by each variable name).
# NOTE(review): how these lists are applied is not visible in this part of the notebook — confirm downstream usage.
leaderboard_system_without_evaluation_datasets = ['Ko Chatbot Arena']
leaderboard_system_without_pull_requests = ['SEAL', 'FSMBench', 'CompMix', 'DocVQA', 'GENIE', 'InfographicVQA', 'LMExamQA', 'Models Leaderboard', 'MP-DocVQA', 'OpenEval', 'Program Synthesis Models Leaderboard', 'ProtoQA', 'TextSynth Server']
leaderboard_system_without_contacts = ['OpenEval']
leaderboard_system_without_documentation = ['FSMBench']
leaderboard_system_without_evaluation_harness = ['LLM-Leaderboard']

# Groups the individual display formats under two macro categories ('Table' and 'Figure').
macro_display_format_mapping = {
    'Table': ['Regular Table', 'Rankable Table', 'Table Screenshot'],
    'Figure': ['Bar Chart', 'Box Plot', 'Heat Map', 'Line Chart', 'Pie Chart', 'Radar Chart', 'Scatter Plot', 'Rankable Bar Chart'],
}

# Short platform codes -> full platform names. Used by string_to_list / string_to_dict
# (when called with platform=True) and inverted into platform_abbreviation_mapping_inverse.
platform_abbreviation_mapping = {
    'gh': 'GitHub',
    'hf': 'Hugging Face Spaces',
    'pwc': 'Papers With Code',
    'ip': 'independent platform',
}

# Category -> member tactics for organizing ranking dataframes.
# Inverted (member -> category) into ranking_dataframe_organization_tactics_mapping_inverse.
ranking_dataframe_organization_tactics_mapping = {
    'Algorithm': ['Algorithm'],
    'Evaluation Configuration': ['Dataset Slice', 'Evaluator', 'Metric'],
    'Leaderboard Aggregation': ['Aggregated Result'],
    'Leaderboard Release': ['Leaderboard Launch Date', 'Leaderboard Version'],
    'Model Capability': ['Benchmark Dataset', 'Service Load', 'Supported Functionality', 'Supported Language', 'Supported Modality', 'Task'],
    'Model Information': ['Model Accessibility', 'Model Size', 'Model Type'],
    'Prompt Engineering': ['#Prompt Example', 'Output Length', 'Prompt Design', 'Prompt Length', 'Relation Extractor', 'Tokenizer']
}

# Canonical publisher name -> names that are folded into it (labs, campuses, subsidiaries).
# Inverted (variant -> canonical) into publisher_synonyms_inverse, which
# publisher_synonyms_mapping() consults.
publisher_synonyms = {
    'Alibaba Group': ['DAMO Academy', 'Aliyun'],
    'Amazon': ['Alexa AI Lab', 'AWS AI Lab'],
    'Agency for Science Technology and Research': ['A*STAR I2R', 'CFAR A*STAR'],
    'Bauhaus University': ['Bauhaus University Weimar'],
    'ByteDance': ['ByteDance AI Lab'],
    'Chinese Academy of Sciences': ['University of Chinese Academy of Sciences'],
    'CSIRO': ['Data61'],
    'Fraunhofer Society': ['Fraunhofer Institute for Integrated Circuits'],
    'Frédéric Joliot Institute for Life Sciences': ['NeuroSpin'],
    'Google': ['Google Brain', 'Google DeepMind', 'Google Blueshift'],
    'Huawei': ["Huawei Noah's Ark Lab"],
    'Jingdong': ['Explore Academy'],
    'Kunlun Tech': ['Skywork'],
    'Max Planck Society': ['Max Planck Institute for Informatics', 'Max Planck Institute for Intelligent Systems', 'Max Planck Institute for Mathematics in the Sciences'],
    'Meta': [
        'Meta FAIR',
        'Meta GenAI'
    ],
    'Microsoft': ['Microsoft Research Asia'],
    'National Public School': ['National Public School HSR Layout'],
    'Naver': ['Naver Labs Europe'],
    'Queen\'s University Kingston': ['Queen\'s University'],
    'Tencent': [
        'Tencent AI Lab',
        'Tencent ARC Lab',
        'Tencent Youtu Lab'
    ],
    'Toyota Technological Institute': ['Toyota Technological Institute Chicago'],
    'University of California': [
        'University of California Berkeley',
        'University of California Davis',
        'University of California Irvine',
        'University of California Los Angeles',
        'University of California Santa Barbara',
        'University of California Santa Cruz',
        'University of California San Diego',
    ],
    'University of Michigan': ['University of Michigan Ann Arbor'],
    'University of North Carolina': ['University of North Carolina Chapel Hill'],
    'University of Illinois': ['University of Illinois Chicago', 'University of Illinois Urbana Champaign'],
    'University of Massachusetts': ['University of Massachusetts Amherst'],
    'University of Maryland': ['University of Maryland College Park'],
    'University of Tennessee': ['University of Tennessee Knoxville'],
    'University of Texas': ['University of Texas Austin'],
    'University of Wisconsin': ['University of Wisconsin Madison'],
}

# Canonical (lower-case) metric / column name -> variant spellings that are folded into it.
# Inverted (variant -> canonical) into metrics_synonyms_inverse.
# The variants include abbreviations, dataset- or task-prefixed forms, Chinese labels and
# misspellings (e.g. 'accuarcy', 'orgaisation').
# NOTE(review): the misspelled variants presumably mirror headers found in the scraped
# leaderboards, so they must not be "corrected" — confirm against the data.
metrics_synonyms = {
    'accuracy': [
        'acc',
        'accuarcy',
        'qa accuracy'
    ],
    'average': [
        'avg',
        '平均'
    ],
    'average accuracy': [
        'avg. accuracy'
    ],
    'average score': ['平均分'],
    'bleu': ['bleu score'],
    'bleu-1': [
        'narrativeqa bleu-1',
        'socialiqa bleu-1',
        'mcscript bleu-1',
        'cosmosqa bleu-1'
    ],
    'bleu-4': ['bleu4'],
    'bertscore': ['bert score'],
    'code': ['代码'],
    'elo rating': [
        'chatbot arena elo',
        'elo'
    ],
    'exact match': ['em', 'exact match accuracy'],
    'lerc': [
        'cosmosqa lerc',
        'mcscript lerc',
        'socialiqa lerc',
        'narrativeqa lerc'
    ],
    'link': ['url'],
    'mean rank': [
        'text-to-video mean rank',
        'video-to-text mean rank'
    ],
    'median rank': [
        'text-to-video median rank',
        'video-to-text median rank',
        'text-to-videomedian rank',
        'text-to-video medianr'
    ],
    'meteor': [
        'cosmosqa meteor',
        'narrativeqa meteor',
        'socialiqa meteor',
        'mcscript meteor'
    ],
    'neg mean rank': [
        'i->t neg mean rank',
        't->i neg mean rank'
    ],
    'organization': [
        '发布机构',
        '机构',
        'orgaisation',
    ],
    'others': ['其他'],
    'overall': ['xiezhi overall'],
    'overall score': [
        '总分',
        '总体分数'
    ],
    'pass@1': [
        'interview pass@1',
        'competition pass@1',
        'introductory pass@1'
    ],
    'pass@5': [
        'interview pass@5',
        'introductory pass@5',
        'competition pass@5'
    ],
    'pass@1000': [
        'interview pass@1000',
        'competition pass@1000',
        'introductory pass@1000'
    ],
    'pass@any': [
        'introductory pass@any',
        'competition pass@any',
        'interview pass@any'
    ],
    '#parameters':  [
        '#p',
        '#params',
        '# params',
        '#size',
        '参数量',
        'model size',
        'model size/b',
        'number of params',
        'param',
        'parameters',
        'params',
        'size'
    ],
    'perplexity': ['ppl'],
    'precision@1': ['i->t p@1'],
    'precision@20': ['p@20'],
    'recall@1': [
        'r@1',
        'text-to-videor@1',
        'video-to-text r@1',
        'text-to-video r@1',
        'text-to-image r@1',
        'image-to-text r@1'
    ],
    'recall@5': [
        'text-to-image r@5',
        'video-to-text r@5',
        'image-to-text r@5',
        'text-to-video r@5',
        'r@5',
    ],
    'recall@10': [
        'recall@10 on 1 rounds',
        'recall@10 on 2 rounds',
        'recall@10 on 3 rounds',
        'r@10',
        'video-to-text r@10',
        'text-to-image r@10',
        'text-to-video r@10',
        'image-to-text r@10'
    ],
    'recall@50': [
        'text-to-video r@50',
        'video-to-text r@50',
    ],
    'score': ['分数'],
    'submission date': ['提交时间'],
    'top-1 accuracy': ['top 1 accuracy'],
    'top-5 accuracy': ['top 5 accuracy'],
    'type': ['model type'],
    'win rate': ['胜率'],
    'word error rate': ['wer']
}

# Benchmark name -> list of Papers With Code leaderboard slugs grouped under that benchmark.
# NOTE(review): the slugs look like the last path component of paperswithcode.com "sota" URLs — confirm.
# NOTE(review): some lists repeat the same slug ('ActivityNet Captions', 'MSVD-QA', 'RefCOCO'),
# and some slugs are listed under more than one benchmark ('spatio-temporal-action-localization-on-ava'
# under both 'AVA' and 'Kinetics'; the two 'multi-task-language-understanding-on-bbh-*' slugs under
# both 'BBH' and 'BIG-Bench') — confirm whether this is intended before counting leaderboards.
pwc_leaderboard_mapping = {
    'A-OKVQA': ['visual-question-answering-on-a-okvqa'],
    'ACE (2005)': ['relation-extraction-on-ace-2005'],
    'ADE20K': ['semantic-segmentation-on-ade20k'],
    'AI2D': ['visual-question-answering-vqa-on-ai2d'],
    'AISHELL-1': ['speech-recognition-on-aishell-1'],
    'ANLI': ['natural-language-inference-on-anli-test'],
    'APPS': ['code-generation-on-apps'],
    'ARC Challenge': ['common-sense-reasoning-on-arc-challenge', 'common-sense-reasoning-on-arc-easy'],
    'ASDiv': ['math-word-problem-solving-on-asdiv-a'],
    'AVA': ['action-recognition-on-ava-v2-2', 'spatio-temporal-action-localization-on-ava'],
    'ActivityNet Captions': ['video-captioning-on-activitynet-captions', 'video-captioning-on-activitynet-captions'],
    'ActivityNet': ['temporal-action-localization-on-activitynet', 'video-retrieval-on-activitynet', 'zero-shot-video-retrieval-on-activitynet'],
    'ActivityNet-QA': ['video-question-answering-on-activitynet-qa'],
    'AudioCaps': ['audio-to-text-retrieval-on-audiocaps', 'text-to-audio-retrieval-on-audiocaps', 'zero-shot-audio-captioning-on-audiocaps'],
    'BACE': ['molecular-property-prediction-on-bace-1'],
    'BANKING77': ['intent-detection-on-banking77'],
    'BBBP': ['molecular-property-prediction-on-bbbp-1'],
    'BBH': ['multi-task-language-understanding-on-bbh-nlp', 'multi-task-language-understanding-on-bbh-alg'],
    'BC5CDR': ['named-entity-recognition-ner-on-bc5cdr'],
    'BEIR': ['argument-retrieval-on-arguana-beir', 'argument-retrieval-on-touche-2020-beir', 'biomedical-information-retrieval-on-bioasq-1', 'biomedical-information-retrieval-on-nfcorpus-1', 'biomedical-information-retrieval-on-trec-1', 'citation-prediction-on-scidocs-beir', 'duplicate-question-retrieval-on-cqadupstack-1', 'duplicate-question-retrieval-on-quora-beir', 'entity-retrieval-on-dbpedia-beir', 'fact-checking-on-scifact-beir', 'fact-checking-on-fever-beir', 'fact-checking-on-climate-fever-beir', 'zero-shot-text-search-on-beir', 'news-retrieval-on-trec-news-beir', 'passage-retrieval-on-msmarco-beir', 'question-answering-on-fiqa-2018-beir', 'question-answering-on-hotpotqa-beir', 'tweet-retrieval-on-signal-1m-rt-beir'],
    'BIG-Bench': ['mathematical-induction-on-big-bench', 'physics-mc-on-big-bench', 'riddle-sense-on-big-bench', 'figure-of-speech-detection-on-big-bench', 'fantasy-reasoning-on-big-bench', 'common-sense-reasoning-on-big-bench-logical', 'logical-reasoning-on-big-bench-logical', 'analogical-similarity-on-big-bench', 'implicit-relations-on-big-bench', 'intent-recognition-on-big-bench', 'lambada-on-big-bench', 'movie-dialog-same-or-different-on-big-bench', 'nonsense-words-grammar-on-big-bench', 'phrase-relatedness-on-big-bench', 'question-selection-on-big-bench', 'misconceptions-on-big-bench', 'sentence-ambiguity-on-big-bench', 'general-knowledge-on-big-bench', 'analytic-entailment-on-big-bench', 'entailed-polarity-on-big-bench', 'epistemic-reasoning-on-big-bench', 'evaluating-information-essentiality-on-big', 'logical-args-on-big-bench', 'metaphor-boolean-on-big-bench', 'physical-intuition-on-big-bench', 'presuppositions-as-nli-on-big-bench', 'discourse-marker-prediction-on-big-bench', 'empirical-judgments-on-big-bench', 'irony-identification-on-big-bench', 'english-proverbs-on-big-bench', 'similarities-abstraction-on-big-bench', 'gre-reading-comprehension-on-big-bench', 'crash-blossom-on-big-bench', 'human-organs-senses-multiple-choice-on-big', 'odd-one-out-on-big-bench', 'identify-odd-metapor-on-big-bench', 'dark-humor-detection-on-big-bench', 'understanding-fables-on-big-bench', 'timedial-on-big-bench', 'common-sense-reasoning-on-big-bench-known', 'language-modelling-on-big-bench-lite', 'auto-debugging-on-big-bench-lite', 'memorization-on-big-bench-hindu-knowledge', 'logical-reasoning-on-big-bench-strategyqa', 'logical-reasoning-on-big-bench-logic-grid', 'crass-ai-on-big-bench', 'multiple-choice-question-answering-mcqa-on-31', 'word-sense-disambiguation-on-big-bench', 'multi-task-language-understanding-on-bbh-alg', 'sarcasm-detection-on-big-bench-snarks', 'common-sense-reasoning-on-big-bench-sports', 'multiple-choice-question-answering-mcqa-on-30', 
'logical-reasoning-on-big-bench-temporal', 'common-sense-reasoning-on-big-bench', 'common-sense-reasoning-on-big-bench-causal', 'common-sense-reasoning-on-big-bench-date', 'logical-reasoning-on-big-bench-formal', 'multiple-choice-question-answering-mcqa-on-27', 'multiple-choice-question-answering-mcqa-on-28', 'multiple-choice-question-answering-mcqa-on-29', 'logical-reasoning-on-big-bench-penguins-in-a', 'logical-reasoning-on-big-bench-reasoning', 'multi-task-language-understanding-on-bbh-nlp'],
    'BenchLMM': ['visual-question-answering-on-benchlmm'],
    'BioASQ': ['question-answering-on-bioasq'],
    'BioLAMA': ['knowledge-probing-on-biolama'],
    'BoolQ': ['question-answering-on-boolq'],
    'C4': ['language-modelling-on-c4'],
    'CB': ['natural-language-inference-on-commitmentbank'],
    'CFQ': ['semantic-parsing-on-cfq'],
    'CIFAR-10': ['image-classification-on-cifar-10'],
    'CLUE': ['language-modelling-on-clue-afqmc', 'language-modelling-on-clue-ocnli-50k', 'language-modelling-on-clue-drcd', 'language-modelling-on-clue-cmnli', 'language-modelling-on-clue-wsc1-1', 'language-modelling-on-clue-c3', 'language-modelling-on-clue-cmrc2018'],
    'CNN DM': ['document-summarization-on-cnn-daily-mail', 'abstractive-text-summarization-on-cnn-daily'],
    'COCO Captions': ['image-captioning-on-coco-captions'],
    'COPA': ['question-answering-on-copa'],
    'ChEBI-20': ['cross-modal-retrieval-on-chebi-20', 'text-based-de-novo-molecule-generation-on', 'molecule-captioning-on-chebi-20'],
    'Charades': ['zero-shot-action-recognition-on-charades-1'],
    'Charades-STA': ['moment-retrieval-on-charades-sta'],
    'ChartQA': ['chart-question-answering-on-chartqa'],
    'Civil Comments': ['toxic-comment-classification-on-civil'],
    'Clotho': ['text-to-audio-retrieval-on-clotho', 'audio-captioning-on-clotho', 'audio-to-text-retrieval-on-clotho', 'zero-shot-text-to-audio-retrieval-on-clotho'],
    'CoLA': ['linguistic-acceptability-on-cola'],
    'CoNLL': ['coreference-resolution-on-conll-2012', 'coreference-resolution-on-conll12', 'joint-entity-and-relation-extraction-on-2', 'named-entity-recognition-ner-on-conll-2003', 'named-entity-recognition-on-conll03', 'relation-extraction-on-conll04', 'semantic-role-labeling-on-conll-2005', 'semantic-role-labeling-on-conll05-wsj', 'semantic-role-labeling-on-conll12'],
    'CoNaLa': ['code-generation-on-conala'],
    'CoQA': ['question-answering-on-coqa'],
    'CodeContests': ['code-generation-on-codecontests'],
    'Common Voice': ['speech-recognition-on-common-voice-8-0-13', 'speech-recognition-on-common-voice-8-0-14', 'speech-recognition-on-common-voice-8-0-35', 'speech-recognition-on-common-voice-8-0-21', 'speech-recognition-on-common-voice-8-0-19', 'speech-recognition-on-common-voice-8-0-15', 'speech-recognition-on-common-voice-7-0-irish', 'speech-recognition-on-common-voice-8-0-irish', 'speech-recognition-on-common-voice-2', 'speech-recognition-on-common-voice-7-0-3', 'speech-recognition-on-common-voice-8-0-german', 'speech-recognition-on-common-voice-8-0-6', 'speech-recognition-on-common-voice-7-0-4', 'speech-recognition-on-common-voice-7-0-13', 'speech-recognition-on-common-voice-8-0-37', 'speech-recognition-on-common-voice-8-0-22', 'speech-recognition-on-common-voice-8-0', 'speech-recognition-on-common-voice-frisian', 'speech-recognition-on-common-voice-8-0-4', 'speech-recognition-on-common-voice-italian', 'speech-recognition-on-common-voice-8-0-french', 'speech-recognition-on-common-voice-english', 'speech-recognition-on-common-voice-8-0-hindi', 'speech-recognition-on-common-voice-7-0-5', 'speech-recognition-on-common-voice-7-0-hindi', 'speech-recognition-on-common-voice-8-0-dutch', 'speech-recognition-on-common-voice-spanish', 'speech-recognition-on-common-voice-french', 'speech-recognition-on-common-voice-german'],
    'ComplexWebQuestions': ['knowledge-base-question-answering-on'],
    'CrossNER': ['zero-shot-named-entity-recognition-ner-on-1'],
    'CrowS-Pairs': ['stereotypical-bias-analysis-on-crows-pairs'],
    'DROP': ['question-answering-on-drop-test', 'question-answering-on-drop'],
    'DiDeMo': ['video-retrieval-on-didemo', 'zero-shot-video-retrieval-on-didemo'],
    'DocVQA': ['visual-question-answering-on-docvqa-test'],
    'FLEURS': ['automatic-speech-recognition-on-fleurs-1'],
    'FSD50K': ['audio-classification-on-fsd50k'],
    'FewCLUE': ['language-modelling-on-fewclue-eprstmt', 'language-modelling-on-fewclue-ocnli-fc', 'language-modelling-on-fewclue-bustm', 'language-modelling-on-fewclue-chid-fc', 'language-modelling-on-fewclue-cluewsc-fc'],
    'FinQA': ['question-answering-on-finqa'],
    'FineAction': ['temporal-action-localization-on-fineaction'],
    'Flickr30K': ['zero-shot-cross-modal-retrieval-on-flickr30k', 'image-to-text-retrieval-on-flickr30k'],
    'Food-101': ['zero-shot-transfer-image-classification-on-17'],
    'GEM': ['extreme-summarization-on-gem-xsum'],
    'GENIA': ['named-entity-recognition-on-genia'],
    'GQA': ['visual-question-answering-on-gqa-test-dev'],
    'GSM8K': ['arithmetic-reasoning-on-gsm8k'],
    'HIV': ['molecular-property-prediction-on-hiv-dataset'],
    'HMDB51': ['action-recognition-in-videos-on-hmdb-51', 'zero-shot-action-recognition-on-hmdb51'],
    'HallusionBench': ['visual-question-answering-vqa-on-3'],
    'HellaSwag': ['sentence-completion-on-hellaswag'],
    'HumanEval': ['code-generation-on-humaneval'],
    'IFEval': ['instruction-following-on-ifeval'],
    'IUPAC': ['iupac-name-prediction-on-iupac'],
    'ImageNet': ['few-shot-image-classification-on-imagenet-10', 'few-shot-image-classification-on-imagenet-1-1', 'few-shot-image-classification-on-imagenet-5', 'image-classification-on-imagenet', 'self-supervised-image-classification-on', 'self-supervised-image-classification-on-1', 'zero-shot-transfer-image-classification-on-1', 'zero-shot-transfer-image-classification-on-3'],
    'InfoSeek': ['visual-question-answering-vqa-on-infoseek'],
    'InfographicVQA': ['visual-question-answering-vqa-on'],
    'JFT-300M': ['image-classification-on-jft-300m'],
    'Kinetics': ['action-classification-on-kinetics-400', 'action-classification-on-kinetics-600', 'action-classification-on-kinetics-700', 'spatio-temporal-action-localization-on-ava', 'video-generation-on-kinetics-600-12-frames', 'zero-shot-action-recognition-on-kinetics'],
    'LAMBADA': ['language-modelling-on-lambada'],
    'LLaVA-Bench': ['visual-instruction-following-on-llava-bench'],
    'LibriSpeech': ['speech-recognition-on-librispeech-test-clean', 'speech-recognition-on-librispeech-test-other'],
    'MATH': ['math-word-problem-solving-on-math'],
    'MAWPS': ['math-word-problem-solving-on-mawps'],
    'MBPP': ['code-generation-on-mbpp'],
    'MGSM': ['multi-task-language-understanding-on-mgsm'],
    'MM-Vet': ['visual-question-answering-on-mm-vet'],
    'MMLU': ['multi-task-language-understanding-on-mmlu', 'mathematical-reasoning-on-mmlu-mathematics', 'multiple-choice-question-answering-mcqa-on-11', 'multiple-choice-question-answering-mcqa-on-8', 'multiple-choice-question-answering-mcqa-on-25', 'multiple-choice-question-answering-mcqa-on-7', 'multiple-choice-question-answering-mcqa-on-9', 'multiple-choice-question-answering-mcqa-on-10', 'multiple-choice-question-answering-mcqa-on-13', 'multiple-choice-question-answering-mcqa-on-12', 'multiple-choice-question-answering-mcqa-on-2', 'multiple-choice-question-answering-mcqa-on-3', 'multiple-choice-question-answering-mcqa-on-4', 'multiple-choice-question-answering-mcqa-on-5', 'multiple-choice-question-answering-mcqa-on-16', 'multiple-choice-question-answering-mcqa-on-17', 'multiple-choice-question-answering-mcqa-on-18', 'multiple-choice-question-answering-mcqa-on-20', 'multiple-choice-question-answering-mcqa-on-14', 'multiple-choice-question-answering-mcqa-on-19', 'multiple-choice-question-answering-mcqa-on-6', 'multiple-choice-question-answering-mcqa-on-15', 'multiple-choice-question-answering-mcqa-on-24', 'multiple-choice-question-answering-mcqa-on-26', 'multiple-choice-question-answering-mcqa-on-23'],
    'MRPC': ['semantic-textual-similarity-on-mrpc'],
    'MSCOCO': ['image-captioning-on-coco', 'image-retrieval-on-coco', 'image-to-text-retrieval-on-coco', 'text-to-image-generation-on-coco', 'zero-shot-cross-modal-retrieval-on-coco-2014'],
    'MSRVTT': ['text-to-video-generation-on-msr-vtt', 'video-captioning-on-msr-vtt-1', 'video-retrieval-on-msr-vtt', 'zero-shot-video-retrieval-on-msr-vtt', 'video-retrieval-on-msr-vtt-1ka'],
    'MSRVTT-QA': ['zeroshot-video-question-answer-on-msrvtt-qa', 'video-question-answering-on-msrvtt-qa', 'visual-question-answering-on-msrvtt-qa-1'],
    'MSVD': ['video-retrieval-on-msvd', 'video-captioning-on-msvd-1', 'zero-shot-video-retrieval-on-msvd'],
    'MSVD-QA': ['zeroshot-video-question-answer-on-msvd-qa', 'zeroshot-video-question-answer-on-msvd-qa'],
    'MathQA': ['math-word-problem-solving-on-mathqa'],
    'MedMCQA': ['multiple-choice-question-answering-mcqa-on-21'],
    'MedQA': ['question-answering-on-medqa-usmle'],
    'MiT': ['action-classification-on-moments-in-time'],
    'MoleculeNet': ['molecular-property-prediction-on-moleculenet'],
    'MultiRC': ['question-answering-on-multirc'],
    'MusicCaps': ['text-to-music-generation-on-musiccaps'],
    'MusicQA': ['music-question-answering-on-musicqa'],
    'NExT-QA': ['temporal-casual-qa-on-next-qa', 'question-answering-on-next-qa-open-ended', 'video-question-answering-on-next-qa', 'zero-shot-video-question-answer-on-next-qa', 'zero-shot-video-question-answer-on-next-gqa'],
    'NLVR': ['visual-reasoning-on-nlvr2-test', 'visual-reasoning-on-nlvr2-dev'],
    'NQ': ['passage-retrieval-on-natural-questions', 'question-answering-on-natural-questions'],
    'NoCaps': ['image-captioning-on-nocaps-entire', 'image-captioning-on-nocaps-near-domain', 'image-captioning-on-nocaps-out-of-domain', 'image-captioning-on-nocaps-in-domain', 'image-captioning-on-nocaps-val-in-domain', 'image-captioning-on-nocaps-val-overall', 'image-captioning-on-nocaps-val-out-domain', 'image-captioning-on-nocaps-val-near-domain'],
    'OK-VQA': ['visual-question-answering-on-ok-vqa'],
    'OVEN': ['fine-grained-image-recognition-on-oven'],
    'OmniBenchmark': ['image-classification-on-omnibenchmark'],
    'OpenbookQA': ['question-answering-on-openbookqa', 'question-answering-on-obqa'],
    'PIQA': ['question-answering-on-piqa'],
    'PMC-VQA': ['generative-visual-question-answering-on-pmc', 'visual-question-answering-vqa-on-pmc-vqa', 'medical-visual-question-answering-on-pmc-vqa'],
    'Pets37': ['fine-grained-image-classification-on-oxford-1'],
    'PubChemQA': ['question-answering-on-pubchemqa'],
    'PubMedQA': ['question-answering-on-pubmedqa'],
    'QNLI': ['natural-language-inference-on-qnli'],
    'RACE': ['reading-comprehension-on-race', 'question-answering-on-race'],
    'RAFT': ['few-shot-text-classification-on-raft'],
    'RTE': ['natural-language-inference-on-rte'],
    'RareAct': ['action-recognition-on-rareact'],
    'ReCoRD': ['common-sense-reasoning-on-record'],
    'RefCOCO': ['referring-expression-comprehension-on-refcoco-1', 'referring-expression-comprehension-on-refcoco-1', 'referring-expression-segmentation-on-refcocog', 'referring-expression-segmentation-on-refcoco', 'referring-expression-comprehension-on-1', 'referring-expression-comprehension-on', 'referring-expression-comprehension-on-refcoco'],
    'Robust (2004)': ['ad-hoc-information-retrieval-on-trec-robust04'],
    'SCROLLS': ['long-range-modeling-on-scrolls'],
    'SICK': ['semantic-textual-similarity-on-sick', 'semantic-textual-similarity-on-sick-r-1'],
    'SIDER': ['molecular-property-prediction-on-sider-1'],
    'SIQA': ['question-answering-on-social-iqa'],     
    'SPGISpeech': ['speech-recognition-on-spgispeech'],
    'SQuAD': ['question-answering-on-squad11-dev'],
    'SST': ['sentiment-analysis-on-sst-2-binary'],
    'STAR': ['video-question-answering-on-situated', 'zero-shot-video-question-answer-on-star', 'zero-shot-video-question-answer-on-star-1'],
    'STS-B': ['semantic-textual-similarity-on-sts-benchmark', 'semantic-textual-similarity-on-sts13', 'semantic-textual-similarity-on-sts14', 'semantic-textual-similarity-on-sts12', 'semantic-textual-similarity-on-sts15', 'semantic-textual-similarity-on-sts16', 'semantic-similarity-on-sts-benchmark'],
    'SVAMP': ['math-word-problem-solving-on-svamp'],
    'SWE-bench': ['bug-fixing-on-swe-bench'],
    'SciQ': ['text-generation-on-sciq'],
    'ScienceQA': ['science-question-answering-on-scienceqa'],
    'Something-Something': ['action-recognition-in-videos-on-something'],
    'Spider': ['text-to-sql-on-spider', 'semantic-parsing-on-spider'],
    'StereoSet': ['bias-detection-on-stereoset-1'],
    'StoryCloze': ['question-answering-on-storycloze'],
    'StrategyQA': ['question-answering-on-strategyqa'],
    'TACRED': ['relation-extraction-on-tacred'],
    'TED-LIUM': ['speech-recognition-on-tedlium'],
    'TGIF-QA': ['tgif-frame-on-tgif-qa', 'zeroshot-video-question-answer-on-tgif-qa', 'zeroshot-video-question-answer-on-tgif-qa-1', 'visual-question-answering-on-tgif-qa'],
    'TREC-COVID': ['zero-shot-text-search-on-trec-covid'],
    'TVQA': ['video-question-answering-on-tvqa', 'zero-shot-video-question-answer-on-tvqa'],
    'TextVQA': ['visual-question-answering-on-textvqa-test-1'],
    'TheoremQA': ['natural-questions-on-theoremqa'],
    'The Pile': ['language-modelling-on-the-pile'],
    # NOTE(review): 'Tox21' carries the same slug as 'The Pile' on the line above, which looks
    # like a copy-paste slip (the other molecular benchmarks here, e.g. 'BACE', 'BBBP', 'SIDER',
    # use 'molecular-property-prediction-on-*' slugs). Confirm the intended slug.
    'Tox21': ['language-modelling-on-the-pile'],
    'TriviaQA': ['question-answering-on-triviaqa'],
    'TruthfulQA': ['question-answering-on-truthfulqa'],
    'TyDiQA-GoldP': ['cross-lingual-question-answering-on-tydiqa'],
    'UCF101': ['action-recognition-in-videos-on-ucf101', 'self-supervised-action-recognition-on-ucf101', 'text-to-video-generation-on-ucf-101', 'zero-shot-action-recognition-on-ucf101', 'video-generation-on-ucf-101'],
    'UniProtQA': ['question-answering-on-uniprotqa'],
    'VATEX': ['video-retrieval-on-vatex', 'video-captioning-on-vatex-1', 'zero-shot-video-retrieval-on-vatex'],
    'VCR': ['visual-question-answering-on-vcr-q-ar-test', 'visual-question-answering-on-vcr-qa-r-test', 'visual-question-answering-on-vcr-q-a-test'],
    'VGG-Sound': ['audio-classification-on-vggsound'],
    'VNHSGE': ['question-answering-on-vnhsge-english', 'question-answering-on-vnhsge-physics', 'question-answering-on-vnhsge-chemistry', 'question-answering-on-vnhsge-biology', 'question-answering-on-vnhsge-history', 'question-answering-on-vnhsge-geography', 'question-answering-on-vnhsge-literature', 'question-answering-on-vnhsge-mathematics-1', 'question-answering-on-vnhsge-civic'],
    'VQA': ['visual-question-answering-on-vqa-v2-val-1', 'visual-question-answering-on-vqa-v2-test-dev-1', 'visual-question-answering-on-vqa-v2-val', 'visual-question-answering-on-vqa-v2-test-std', 'visual-question-answering-on-vqa-v2-test-dev'],
    'VeRi-776': ['vehicle-re-identification-on-veri-776'],
    'VeRi-Wild': ['vehicle-re-identification-on-veri-wild-small'],
    'ViP-Bench': ['visual-question-answering-on-vip-bench'],
    'VideoInstruct': ['video-based-generative-performance', 'video-based-generative-performance-1', 'video-based-generative-performance-2', 'video-based-generative-performance-3', 'video-based-generative-performance-4', 'video-based-generative-performance-5'],
    'VisDial': ['chat-based-image-retrieval-on-visdial'],
    'VizWiz': ['visual-question-answering-on-vizwiz-2020-vqa'],
    'WHOOPS!': ['explanation-generation-on-whoops', 'image-to-text-retrieval-on-whoops', 'image-captioning-on-whoops', 'visual-question-answering-vqa-on-whoops'],
    'WMT (2014)': ['unsupervised-machine-translation-on-wmt2014-1', 'machine-translation-on-wmt2014-french-english', 'machine-translation-on-wmt2014-english-german', 'unsupervised-machine-translation-on-wmt2014-2', 'machine-translation-on-wmt2014-english-french'],
    'WNLI': ['natural-language-inference-on-wnli'],
    'WSC': ['coreference-resolution-on-winograd-schema'],
    'WebQuestions': ['question-answering-on-webquestions'],
    'WebQuestionsSP': ['knowledge-base-question-answering-on-1', 'semantic-parsing-on-webquestionssp'],
    'WenetSpeech': ['speech-recognition-on-wenetspeech'],
    'WikiText-103': ['language-modelling-on-wikitext-103'],
    'WikiText-2': ['language-modelling-on-wikitext-2'],
    'WinoGrande': ['common-sense-reasoning-on-winogrande'],
    'Winoground': ['visual-reasoning-on-winoground'],
    'XCOPA': ['cross-lingual-transfer-on-xcopa'],
    'XSUM': ['text-summarization-on-x-sum'],
    'YouCook2': ['video-retrieval-on-youcook2', 'video-captioning-on-youcook2', 'zero-shot-video-retrieval-on-youcook2'],
    'iNaturalist': ['long-tail-learning-on-inaturalist-2018', 'image-classification-on-inaturalist-2018'],
    'iVQA': ['video-question-answering-on-ivqa'],
}

# PWC leaderboards are retrieved from https://production-media.paperswithcode.com/about/evaluation-tables.json.gz
#
# Leaderboard URLs grouped by orientation (dataset / metric / method / solution), as stated by
# each variable name.
# NOTE(review): the criteria for assigning a leaderboard to a group are not visible here — confirm
# against the study protocol before editing these lists.
dataset_oriented_leaderboards = ['https://www.datacomp.ai/dclm/leaderboard.html', 'https://www.datacomp.ai/dcclip/leaderboard.html', 'https://llm-eval.github.io/pages/leaderboard/advprompt.html#attack-results-view-by-datasets', 'https://huggingface.co/spaces/zhaorui-nb/de-identification-leaderboard']
metric_oriented_leaderboards = ['https://github.com/yuh-zha/AlignScore']
method_oriented_leaderboards = ['https://teddy-xionggz.github.io/MIRAGE', 'https://www.swebench.com', 'https://jykoh.com/vwa', 'https://huggingface.co/spaces/osunlp/TravelPlannerLeaderboard', 'https://huggingface.co/spaces/JetBrains-Research/long-code-arena', 'https://huggingface.co/spaces/OPTML-Group/UnlearnCanvas-Benchmark', 'https://bird-bench.github.io', 'https://huggingface.co/spaces/stabletoolbench/Stable_Tool_Bench_Leaderboard', 'https://huggingface.co/spaces/GPTEval3D/Leaderboard_dev', 'https://huggingface.co/spaces/boyiwei/CoTaEval_leaderboard', 'https://huggingface.co/spaces/locuslab/tofu_leaderboard', 'https://huggingface.co/spaces/Intel/UnlearnDiffAtk-Benchmark', 'https://github.com/svilupp/Julia-LLM-Leaderboard?tab=readme-ov-file#prompting-templates', 'https://llm-eval.github.io/pages/leaderboard/pe.html', 'https://llm-eval.github.io/pages/leaderboard/advprompt.html#all-results-of-prompts', 'https://huggingface.co/spaces/autogenCTF/agent_ctf_leaderboard']
solution_oriented_leaderboards = ['https://eu.aihub.ml/competitions', 'https://aistudio.baidu.com/competition', 'https://www.hilti-challenge.com', 'https://insightface.ai/challenges', 'https://www.aicrowd.com/challenges', 'https://grand-challenge.org/challenges', 'https://dynabench.org/tasks', 'https://www.kaggle.com/competitions', 'https://eval.ai/web/challenges/list', 'https://taostats.io', 'https://artificialanalysis.ai']

In [3]:
# Reverse lookups for the configuration mappings. These read the forward mappings
# from the configuration cell, so that cell has to be executed first.
# For the one-to-many mappings every listed member points back to its key; if a
# member is listed under several keys, the key that comes last in the forward
# mapping wins.
platform_abbreviation_mapping_inverse = dict(
    (full_name, abbreviation)
    for abbreviation, full_name in platform_abbreviation_mapping.items()
)

metrics_synonyms_inverse = {
    alias: canonical
    for canonical, aliases in metrics_synonyms.items()
    for alias in aliases
}

publisher_synonyms_inverse = {
    alias: canonical
    for canonical, aliases in publisher_synonyms.items()
    for alias in aliases
}

ranking_dataframe_organization_tactics_mapping_inverse = {
    tactic: category
    for category, tactics in ranking_dataframe_organization_tactics_mapping.items()
    for tactic in tactics
}

def convert_df_to_dict(df):
    """
    Convert a DataFrame of leaderboards and metrics to a dictionary.

    The first column (by position) of every row is used as the key. The
    remaining cells of that row, with missing values dropped, become the
    value list. When the same key occurs in several rows, the last row wins.

    :param df: DataFrame with leaderboards and metrics
    :return: Dictionary with leaderboards as keys and list of metrics as values
    """
    leaderboard_data = {}

    for _, row in df.iterrows():
        # Explicit positional access: plain ``row[0]`` is label-based when the
        # column labels are integers (KeyError if no column is labelled 0) and
        # relies on a deprecated positional fallback for any other labels.
        key = row.iloc[0]
        # Keep only the cells that actually hold a value.
        leaderboard_data[key] = [value for value in row.iloc[1:] if pd.notna(value)]

    return leaderboard_data

def string_to_list(text, platform=False):
    """
    Split a comma-separated string into a list of tokens.

    :param text: comma-separated string; a missing value (per ``pd.isna``) or
        the literal string 'nan' yields an empty list
    :param platform: when truthy, each token is looked up in
        ``platform_abbreviation_mapping`` and replaced by the mapped value
        (an unknown token raises ``KeyError``)
    :return: list of tokens, or of mapped values when ``platform`` is truthy
    """
    is_missing = pd.isna(text) or text == 'nan'
    if is_missing:
        return []

    tokens = text.split(',')
    if not platform:
        return tokens
    return [platform_abbreviation_mapping[abbreviation] for abbreviation in tokens]

def string_to_dict(s, platform=False, list_format=False):
    """
    Parse a string of the form ``key:item+item,key:item`` into a dictionary.

    Entries are separated by ',', a key is separated from its items by ':',
    and items are separated by '+'. Each entry must contain exactly one ':';
    otherwise the unpacking raises ``ValueError``.

    :param s: encoded string, or a missing value (per ``pd.isna``)
    :param platform: when truthy, each key is replaced by its value in
        ``platform_abbreviation_mapping`` (an unknown key raises ``KeyError``)
    :param list_format: when truthy, return one flat list of all items (in
        order of appearance) instead of the dictionary
    :return: dict mapping key -> list of items, or the flat item list; an
        empty dict / empty list for a missing input
    """
    if pd.isna(s):
        return [] if list_format else {}

    items_by_key = {}
    all_items = []

    for entry in s.split(','):
        name, joined_items = entry.split(':')
        items = joined_items.split('+')
        # Resolve the key first so an unknown platform fails before anything is stored.
        target_key = platform_abbreviation_mapping[name] if platform else name
        items_by_key[target_key] = items
        all_items.extend(items)

    return all_items if list_format else items_by_key

def format_individual_value(x):
    """
    Render a float as fixed-point text without trailing zeros.

    The float is formatted with the ``f`` presentation type (six digits after
    the decimal point), then trailing zeros and a dangling decimal point are
    stripped, e.g. ``2.0 -> '2'`` and ``1.5 -> '1.5'``. Digits beyond the
    sixth decimal place are rounded away. Non-float values are returned
    unchanged.
    """
    if not isinstance(x, float):
        return x
    fixed_point = f"{x:f}"
    without_zeros = fixed_point.rstrip('0')
    return without_zeros.rstrip('.')

def print_empty_folders(root_dir):
    """
    Print every directory below ``root_dir`` that is completely empty.

    A directory is reported only when it contains neither files nor
    subdirectories. ``root_dir`` itself is never reported.

    :param root_dir: directory to scan (``str`` or path-like)
    :return: None; one "Empty folder: <path>" line is printed per match
    """
    # os.walk yields ``dirpath`` as a plain string, so normalise the root the
    # same way; comparing against a Path object would never match and the
    # root itself would be reported.
    root = os.fspath(root_dir)
    for dirpath, dirnames, filenames in os.walk(root):
        # Both lists must be empty: a folder that only holds subfolders is not empty.
        if dirpath != root and not dirnames and not filenames:
            print(f"Empty folder: {dirpath}")
            
def list_directories(folder_path):
    """
    Return the paths of the immediate subdirectories of ``folder_path``.

    Each returned path is ``folder_path`` joined with the entry name; plain
    files are skipped. Order follows ``os.listdir``.
    """
    subdirectories = []
    for entry in os.listdir(folder_path):
        candidate = os.path.join(folder_path, entry)
        if os.path.isdir(candidate):
            subdirectories.append(candidate)
    return subdirectories

def publisher_synonyms_mapping(publishers):
    """
    Normalise publisher names and return the distinct results.

    Each name found in ``publisher_synonyms_inverse`` is replaced by the value
    stored there; any other name is kept as is.

    :param publishers: iterable of publisher names
    :return: set of normalised publisher names
    """
    return {
        publisher_synonyms_inverse.get(publisher, publisher)
        for publisher in publishers
    }

def keep_rows_by_list_column(df, column_name, keyword_list):
    """
    Keeps the rows of a DataFrame whose list column shares at least one element with a given keyword list.
    
    Rows whose list is empty, or contains no keyword at all, are dropped.
    
    Parameters:
    - df: Pandas DataFrame.
    - column_name: The name of the column containing lists of strings.
    - keyword_list: A list of keywords to check against.
    
    Returns:
    - A filtered Pandas DataFrame.
    """
    # A set gives constant-time membership checks
    keyword_set = set(keyword_list)

    def has_keyword(elements):
        # True as soon as one element of the cell is a keyword
        for element in elements:
            if element in keyword_set:
                return True
        return False

    # Boolean mask, one entry per row, used directly to select the rows to keep
    row_mask = df[column_name].apply(has_keyword)
    return df[row_mask]

def filter_rows_by_list_column(df, column_name, keyword_list):
    """
    Drops the rows of a DataFrame whose list column consists only of elements from a given keyword list.
    
    A row is kept when its list has at least one element outside the keyword list;
    rows with an empty list are dropped.
    
    Parameters:
    - df: Pandas DataFrame.
    - column_name: The name of the column containing lists of strings.
    - keyword_list: A list of keywords to check against.
    
    Returns:
    - A filtered Pandas DataFrame.
    """
    # A set gives constant-time membership checks
    keyword_set = set(keyword_list)

    def has_non_keyword(elements):
        # True when some element of the cell is not a keyword
        return any(element not in keyword_set for element in elements)

    # Boolean mask, one entry per row, used directly to select the rows to keep
    row_mask = df[column_name].apply(has_non_keyword)
    return df[row_mask]

In [8]:
import subprocess

# Read the JSON key file stored under path_key and copy its entries into this
# process's environment (presumably so the script launched below can read
# them — confirm against Dependents_Lookup.sh).
with open(f'{path_key}/.sourcegraph.json') as f:
    env_vars = json.load(f)
os.environ.update(env_vars)

# Run the lookup script through `sh`, passing path_data as its only argument.
# check=True turns a non-zero exit status into CalledProcessError, which is
# reported here instead of being propagated.
try:
    subprocess.run(
        ['sh', f'{path_data}/Dependents_Lookup.sh', path_data],
        check=True,
    )
except subprocess.CalledProcessError as error:
    print(f"Script execution failed with error: {error}")
else:
    print("Script executed successfully.")


Script executed successfully.


In [6]:
import json
import webbrowser

# Load the search results saved under path_data.
with open(f"{path_data}/GitHub.json") as f:
    data = json.load(f)

# Open each result in the browser, pausing after every 20th entry.
for index, repo in enumerate(data["Results"]):
    # Entries 0-179 are skipped — presumably reviewed in an earlier session; TODO confirm.
    if index > 179:
        webbrowser.open(f'https://{repo["name"]}')
        # Last entry of a batch of 20: show progress and wait for the user.
        if (index + 1) % 20 == 0:
            print(index)
            code = input("Press enter key to proceed.")
            # Typing "esc" (any letter case) aborts the review loop.
            if code.lower() == 'esc':
                raise KeyboardInterrupt

199
219
239
259
279
299
319
339
359
379
399
419
439
459
479
499
519
539
559
579
599
619
639
659
679
699
719
739
759
779
799
819
839
859
879
899
919
939
959
979
999
1019
1039
1059
1079
1099
1119
1139
1159
1179
1199
1219
1239
1259
1279
1299
1319
1339
1359
1379
1399
1419
1439
1459
1479
1499
1519
1539
1559
1579
1599
1619
1639
1659
1679
1699
1719
1739
1759
1779
1799
1819
1839
1859
1879
1899
1919
1939
1959
1979
1999
2019
2039
2059
2079
2099
2119
2139
2159
2179
2199
2219
2239
2259
2279
2299
2319
2339
2359
2379
2399
2419


In [None]:
github_leaderboard_primary = [
    {
        'leaderboard': 'https://github.com/ray-project/llmperf-leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/vztu/BVQA_Benchmark',
        'reference': 'https://github.com/vztu/RAPIQUE/blob/e637a3d943010940f67ef7b0c19e2f2c81d63b01/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://csbench.github.io/#leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://crowdbenchmark.com/nwpucrowd.html',
        'reference': 'https://github.com/gjy3035/NWPU-Crowd-Sample-Code/blob/fe8e986d23e88f7b9defabbd0b3f6f655803152d/README.md?plain=1#L92'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/Decentralised-AI/falcon-40b/blob/6e61c89591cc7a3328d4010ceaf701dfec03fd18/README.md?plain=1#L183'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/instance-segmentation-on-coco',
        'reference': 'https://github.com/IDEA-Research/DINO/blob/d84a491d41898b3befd8294d1cf2614661fc0953/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/panoptic-segmentation-on-coco-test-dev',
        'reference': 'https://github.com/IDEA-Research/DINO/blob/d84a491d41898b3befd8294d1cf2614661fc0953/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/semantic-segmentation-on-ade20k',
        'reference': 'https://github.com/IDEA-Research/DINO/blob/d84a491d41898b3befd8294d1cf2614661fc0953/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://github.com/kaz-Anova/ensemble_amazon',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/MLBazaar/BTB',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/Codium-ai/AlphaCodium',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.nuscenes.org/object-detection',
        'reference': 'https://github.com/VDIGPKU/HENet/blob/main/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/bigcode/bigcode-models-leaderboard',
        'reference': 'https://github.com/continuedev/what-llm-to-use/blob/main/README.md?plain=1#L39'
    },
    {
        'leaderboard': 'https://wilds.stanford.edu/leaderboard',
        'reference': 'https://github.com/LFhase/PAIR/blob/main/README.md?plain=1#L19'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/dsdanielpark/open-llm-datasets'
    },
    {
        'leaderboard': 'https://github.com/niais/Awesome-Skeleton-based-Action-Recognition',
        'reference': ''
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/2210/leaderboard',
        'reference': 'https://github.com/yanconglin/ICP-Flow/blob/main/README.md?plain=1#L90'
    },
    {
        'leaderboard': 'https://rajpurkar.github.io/SQuAD-explorer',
        'reference': 'https://github.com/zihangdai/xlnet/blob/master/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://cmedbenchmark.llmzoo.com/static/leaderboard.html',
        'reference': 'https://github.com/X-D-Lab/Sunsimiao/blob/master/README.md?plain=1#L82'
    },
    {
        'leaderboard': 'https://ogb.stanford.edu/docs/lsc/leaderboards',
        'reference': 'https://github.com/lmqfly/Geometry-Deep-Learning-for-Drug-Discovery/blob/main/README.md?plain=1#L104'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1832/leaderboard',
        'reference': 'https://github.com/goel-shashank/CyCLIP/blob/main/README.md?plain=1#L82'
    },
    {
        'leaderboard': 'https://www.cvlibs.net/datasets/kitti/eval_object.php',
        'reference': 'https://github.com/fregu856/3DOD_thesis/blob/master/README.md?plain=1#L616'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/ryoungj/ObsScaling/blob/main/README.md?plain=1#L19'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/adithya-s-k/indic_eval/blob/main/README.md?plain=1#L544'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/Cognitive-Lab/indic_llm_leaderboard',
        'reference': 'https://github.com/adithya-s-k/indic_eval/blob/main/README.md?plain=1#L12'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/arjunbansal/awesome-oss-llm-ift-rlhf/blob/main/README.md?plain=1#L51'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/lmsys/chatbot-arena-leaderboard',
        'reference': 'https://github.com/arjunbansal/awesome-oss-llm-ift-rlhf/blob/main/README.md?plain=1#L52'
    },
    {
        'leaderboard': 'https://orionlab.space.noa.gr/mesogeos',
        'reference': 'https://github.com/Orion-AI-Lab/mesogeos/blob/main/README.md?plain=1#L161'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/allstate-claims-severity/leaderboard',
        'reference': 'https://github.com/adornes/spark_python_ml_examples/blob/master/README.md?plain=1#L262'
    },
    {
        'leaderboard': 'https://github.com/salesforce/WikiSQL',
        'reference': ''
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/17640',
        'reference': 'https://github.com/caiyuanhao1998/Retinexformer/blob/master/README.md?plain=1#L111'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/356/leaderboard',
        'reference': 'https://github.com/MCG-NJU/SparseBEV/blob/main/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://github.com/longvideobench/LongVideoBench',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/crowdAI/crowdai-musical-genre-recognition-starter-kit',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/yule-BUAA/MergeLM/blob/main/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://github.com/DetectionTeamUCAS/RRPN_Faster-RCNN_Tensorflow',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/OpenGVLab/MM-NIAH',
        'reference': ''
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/nycc-matching',
        'reference': 'https://github.com/jmhessel/caption_contest_corpus/blob/main/README.md?plain=1#L109'
    },
    {
        'leaderboard': 'https://microsoft.github.io/MSMARCO-Passage-Ranking-Submissions/leaderboard',
        'reference': 'https://github.com/AlibabaResearch/HLATR/blob/main/readme.md?plain=1#L12'
    },
    {
        'leaderboard': 'https://dki-lab.github.io/GrailQA',
        'reference': 'https://github.com/dki-lab/GrailQA/blob/main/README.md?plain=1#L11'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/mengdi-li/awesome-RLAIF/blob/main/README.md?plain=1#L59'
    },
    {
        'leaderboard': 'https://github.com/SilongYong/SQA3D',
        'reference': ''
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb.php?challengeid=11&compid=6',
        'reference': 'https://github.com/kjw0612/awesome-deep-vision/blob/master/README.md?plain=1#L171'
    },
    {
        'leaderboard': 'https://github.com/cathyxl/MAgIC',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/JasonForJoy/Leaderboards-for-Multi-Turn-Response-Selection',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/openai/gym/wiki/Leaderboard',
        'reference': 'https://github.com/pat-coady/trpo/blob/master/README.md?plain=1#L9'
    },
    {
        'leaderboard': 'https://paperswithcode.com/dataset/pascalvoc-sp',
        'reference': 'https://github.com/vijaydwivedi75/lrgb/blob/main/README.md?plain=1#L111'
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb.php?challengeid=11&compid=3',
        'reference': 'https://github.com/SHI-Labs/GFR-DSOD/blob/master/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/OpenMOSS/HalluQA',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/Spico197/Humback/blob/main/README.md?plain=1#L122'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/ikaijua/Awesome-AITools/blob/main/README.md?plain=1#L109'
    },
    {
        'leaderboard': 'https://artificialanalysis.ai/leaderboards/models',
        'reference': 'https://github.com/ikaijua/Awesome-AITools/blob/main/README.md?plain=1#L110'
    },
    {
        'leaderboard': 'https://artificialanalysis.ai/leaderboards/providers',
        'reference': 'https://github.com/ikaijua/Awesome-AITools/blob/main/README.md?plain=1#L110'
    },
    {
        'leaderboard': 'https://artificialanalysis.ai/text-to-image',
        'reference': 'https://github.com/ikaijua/Awesome-AITools/blob/main/README.md?plain=1#L110'
    },
    {
        'leaderboard': 'https://artificialanalysis.ai/speech-to-text',
        'reference': 'https://github.com/ikaijua/Awesome-AITools/blob/main/README.md?plain=1#L110'
    },
    {
        'leaderboard': 'https://artificialanalysis.ai/text-to-speech',
        'reference': 'https://github.com/ikaijua/Awesome-AITools/blob/main/README.md?plain=1#L110'
    },
    {
        'leaderboard': 'https://mcgill-nlp.github.io/bias-bench',
        'reference': 'https://github.com/McGill-NLP/bias-bench/blob/main/README.md?plain=1#L9'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-question-answering-on-mm-vet',
        'reference': 'https://github.com/yuweihao/MM-Vet/blob/main/README.md?plain=1#L30'
    },
    {
        'leaderboard': 'https://github.com/THUDM/AgentBench',
        'reference': ''
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/winogrande',
        'reference': 'https://github.com/allenai/winogrande/blob/master/README.md?plain=1#L21'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/tianyi-lab/Reflection_Tuning/blob/main/README.md?plain=1#L203'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/tianyi-lab/Reflection_Tuning/blob/main/README.md?plain=1#L203'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/tianyi-lab/Reflection_Tuning/blob/main/README.md?plain=1#L203'
    },
    {
        'leaderboard': 'https://dynabench.org/tasks',
        'reference': 'https://github.com/eugenesiow/practical-ml/blob/master/README.md?plain=1#L78'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/9304',
        'reference': 'https://github.com/huzeyann/MemoryEncodingModel/blob/main/README.md?plain=1#L15'
    },
    {
        'leaderboard': 'https://box.vicos.si/borja/viamaro/index.html#leaderboard',
        'reference': 'https://github.com/bborja/modd/blob/master/README.md?plain=1#L150'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/ntut-ml-2018-computer-vision/leaderboard',
        'reference': 'https://github.com/hsuRush/DeepANPR/blob/master/README.md?plain=1#L2'
    },
    {
        'leaderboard': 'https://github.com/XuanwuAI/SecEval',
        'reference': ''
    },
    {
        'leaderboard': 'https://few-shot.yyliu.net/miniimagenet.html',
        'reference': 'https://github.com/indussky8/awesome-few-shot-learning/blob/main/README.md?plain=1#L279'
    },
    {
        'leaderboard': 'https://github.com/iarai/NeurIPS2022-traffic4cast',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/cvgroup-njust/CityPersons',
        'reference': ''
    },
    {
        'leaderboard': 'https://ymcui.com/cmrc2019',
        'reference': 'https://github.com/ymcui/cmrc2019/blob/master/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/fungi-challenge-fgvc-2018/leaderboard',
        'reference': 'https://github.com/visipedia/fgvcx_fungi_comp/blob/master/README.md?plain=1#L10'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1091/leaderboard',
        'reference': 'https://github.com/Raldir/FEVEROUS/blob/main/README.md?plain=1#L171'
    },
    {
        'leaderboard': 'https://rajpurkar.github.io/SQuAD-explorer',
        'reference': 'https://github.com/google-research/bert/blob/master/README.md?plain=1#L194'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/siim-isic-melanoma-classification/leaderboard',
        'reference': 'https://github.com/haqishen/SIIM-ISIC-Melanoma-Classification-1st-Place-Solution/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://cocodataset.org/#stuff-leaderboard',
        'reference': 'https://github.com/nightrome/cocostuff/blob/master/README.md?plain=1#L102'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/WeOpenML/PandaLM/blob/main/README.md?plain=1#L52'
    },
    {
        'leaderboard': 'https://github.com/tianyi-lab/HallusionBench',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/uclaml/SPIN/blob/main/README.md?plain=1#L247'
    },
    {
        'leaderboard': 'https://github.com/mlfoundations/dclm',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.boreas.utias.utoronto.ca/#/leaderboard',
        'reference': 'https://github.com/utiasASRL/hero_radar_odometry/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/880',
        'reference': 'https://github.com/isaaccorley/dfc2022-baseline/blob/master/README.md?plain=1#L34'
    },
    {
        'leaderboard': 'https://haitianliu22.github.io/code-scope-benchmark/leaderboard.html',
        'reference': 'https://github.com/WeixiangYAN/CodeScope/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/databricks/databricks-ml-examples',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/OpenBMB/OlympiadBench',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/AIR-Bench/AIR-Bench',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/decis-bench/febench',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/decis-bench/febench',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.cvlibs.net/datasets/kitti/eval_object.php',
        'reference': 'https://github.com/dashidhy/awesome-point-cloud-deep-learning/blob/master/README.md?plain=1#L60'
    },
    {
        'leaderboard': 'https://www.nuscenes.org/object-detection',
        'reference': 'https://github.com/dashidhy/awesome-point-cloud-deep-learning/blob/master/README.md?plain=1#L61'
    },
    {
        'leaderboard': 'https://github.com/DetectionTeamUCAS/R2CNN-Plus-Plus_Tensorflow',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/diffbot/knowledge-net',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/mlabonne/llm-course/blob/main/README.md?plain=1#L254'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/lmsys/chatbot-arena-leaderboard',
        'reference': 'https://github.com/mlabonne/llm-course/blob/main/README.md?plain=1#L262'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/argilla-io/notus/blob/main/README.md?plain=1#L10'
    },
    {
        'leaderboard': 'https://kgqa.github.io/leaderboard',
        'reference': 'https://github.com/KGQA/leaderboard'
    },
    {
        'leaderboard': 'https://github.com/open-compass/T-Eval',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/KevinLiao159/Quora',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/inspire-group/patch-defense-leaderboard',
        'reference': 'https://github.com/inspire-group/adv-patch-paper-list/blob/main/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://github.com/dynamic-superb/dynamic-superb',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/yizhen20133868/Awesome-TOD-NLG-Survey',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/oshizo/japanese-llm-roleplay-benchmark',
        'reference': ''
    },
    {
        'leaderboard': 'https://waymo.com/open/challenges/2023/motion-prediction',
        'reference': 'https://github.com/zhejz/TrafficBots/blob/main/README.md?plain=1#L51'
    },
    {
        'leaderboard': 'https://paperswithcode.com/dataset/burst',
        'reference': 'https://github.com/Ali2500/BURST-benchmark/blob/main/README.md?plain=1#L112'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/video-super-resolution-on-vid4-4x-upscaling',
        'reference': 'https://github.com/amanchadha/iSeeBetter/blob/master/README.md?plain=1#L19'
    },
    {
        'leaderboard': 'https://github.com/princeton-nlp/LM-Science-Tutor',
        'reference': ''
    },
    {
        'leaderboard': 'https://gluebenchmark.com/leaderboard',
        'reference': 'https://github.com/mwaskom/seaborn-data/blob/master/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/lm-sys/FastChat/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/google-research/meta-dataset',
        'reference': ''
    },
    {
        'leaderboard': 'https://stanfordmlgroup.github.io/competitions/chexpert',
        'reference': 'https://github.com/stanfordmlgroup/MoCo-CXR/blob/main/README.md?plain=1#L71'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/relation-extraction-on-redocred',
        'reference': 'https://github.com/tonytan48/KD-DocRE/blob/main/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1881/leaderboard',
        'reference': 'https://github.com/project-miracl/miracl/blob/main/README.md?plain=1#L23'
    },
    {
        'leaderboard': 'https://fudanselab-classeval.github.io/leaderboard.html',
        'reference': 'https://github.com/FudanSELab/ClassEval/blob/master/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'http://noisylabels.com',
        'reference': 'https://github.com/weijiaheng/Advances-in-Label-Noise-Learning/blob/main/README.md?plain=1#L63'
    },
    {
        'leaderboard': 'https://paperswithcode.com/dataset/animal',
        'reference': 'https://github.com/weijiaheng/Advances-in-Label-Noise-Learning/blob/main/README.md?plain=1#L67'
    },
    {
        'leaderboard': 'https://paperswithcode.com/dataset/clothing1m',
        'reference': 'https://github.com/weijiaheng/Advances-in-Label-Noise-Learning/blob/main/README.md?plain=1#L69'
    },
    {
        'leaderboard': 'https://yale-lily.github.io/sparc',
        'reference': 'https://github.com/taoyds/sparc/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/machine-translation-on-wmt2014-german-english',
        'reference': 'https://github.com/joeynmt/joeynmt/blob/main/README.md?plain=1#L280'
    },
    {
        'leaderboard': 'https://github.com/hendrycks/robustness',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/huguyuehuhu/Awesome-Group-Activity-Recognition',
        'reference': ''
    },
    {
        'leaderboard': 'https://mmcheng.net/videosal',
        'reference': 'https://github.com/MichiganCOG/TASED-Net/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://pmc-patients.github.io',
        'reference': 'https://github.com/pmc-patients/pmc-patients/blob/main/README.md?plain=1#L104'
    },
    {
        'leaderboard': 'https://github.com/Xiangyu-CAS/AICity2020-VOC-ReID',
        'reference': ''
    },
    {
        'leaderboard': 'https://agora-evaluation.is.tuebingen.mpg.de',
        'reference': 'https://github.com/IDEA-Research/OSX/blob/main/README.md?plain=1#L41'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/robust-camera-only-3d-object-detection-on',
        'reference': 'https://github.com/Daniel-xsy/RoboBEV/blob/master/README.md?plain=1#L90'
    },
    {
        'leaderboard': 'https://waymo.com/open/challenges',
        'reference': 'https://github.com/Nightmare-n/GD-MAE/blob/main/README.md?plain=1#L12'
    },
    {
        'leaderboard': 'https://github.com/GAIR-NLP/auto-j',
        'reference': ''
    },
    {
        'leaderboard': 'https://zjysteven.github.io/OpenOOD/#leaderboard',
        'reference': 'https://github.com/Jingkang50/OpenOOD/blob/main/README.md?plain=1#L57'
    },
    {
        'leaderboard': 'https://webots.cloud/competition',
        'reference': 'https://github.com/cyberbotics/wrestling/blob/main/README.md?plain=1#L79'
    },
    {
        'leaderboard': 'https://github.com/TellinaTool/nl2bash',
        'reference': ''
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota',
        'reference': 'https://github.com/paperswithcode/releasing-research-code/blob/master/README.md?plain=1#L94'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/list',
        'reference': 'https://github.com/paperswithcode/releasing-research-code/blob/master/README.md?plain=1#L96'
    },
    {
        'leaderboard': 'https://nlpprogress.com',
        'reference': 'https://github.com/paperswithcode/releasing-research-code/blob/master/README.md?plain=1#L97'
    },
    {
        'leaderboard': 'https://github.com/SUFE-AIFLM-Lab/FinEval',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/FuxiaoLiu/LRV-Instruction',
        'reference': ''
    },
    {
        'leaderboard': 'https://scandeval.com',
        'reference': 'https://github.com/BramVanroy/fietje-2/blob/main/README.md?plain=1#L32'
    },
    {
        'leaderboard': 'https://github.com/JasonForJoy/Leaderboards-for-Multi-Turn-Response-Selection',
        'reference': 'https://github.com/chauff/conversationalIR/blob/master/README.md?plain=1#L75'
    },
    {
        'leaderboard': 'https://paperswithcode.com/task/conversational-response-selection',
        'reference': 'https://github.com/chauff/conversationalIR/blob/master/README.md?plain=1#L77'
    },
    {
        'leaderboard': 'https://multi-trust.github.io/#leaderboard',
        'reference': 'https://github.com/thu-ml/MMTrustEval/blob/main/README.md?plain=1#L11'
    },
    {
        'leaderboard': 'https://www.cluebenchmarks.com/nli.html',
        'reference': 'https://github.com/CLUEbenchmark/OCNLI/blob/main/README.md?plain=1#L59'
    },
    {
        'leaderboard': 'https://github.com/princeton-nlp/CharXiv',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/TIGER-Lab/LongICL-Leaderboard',
        'reference': 'https://github.com/TIGER-AI-Lab/LongICLBench/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/CLUEbenchmark/CLUE',
        'reference': 'https://github.com/shibing624/pytextclassifier/blob/master/README.md?plain=1#L549'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/drop',
        'reference': 'https://github.com/llamazing/numnet_plus/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/MLGroupJLU/LLM-eval-survey/blob/main/README.md?plain=1#L343'
    },
    {
        'leaderboard': 'https://agora-evaluation.is.tuebingen.mpg.de',
        'reference': 'https://github.com/ttxskk/AiOS/blob/main/README.md?plain=1#L288'
    },
    {
        'leaderboard': 'https://www.nuscenes.org/object-detection',
        'reference': 'https://github.com/HorizonRobotics/Sparse4D/blob/main/README.md?plain=1#L59'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/163/leaderboard',
        'reference': 'https://github.com/airsplay/lxmert/blob/master/README.md?plain=1#L132'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/225/leaderboard',
        'reference': 'https://github.com/airsplay/lxmert/blob/master/README.md?plain=1#L216'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/225/leaderboard',
        'reference': 'https://github.com/airsplay/lxmert/blob/master/README.md?plain=1#L216'
    },
    {
        'leaderboard': 'https://lil.nlp.cornell.edu/nlvr',
        'reference': 'https://github.com/airsplay/lxmert/blob/master/README.md?plain=1#L271'
    },
    {
        'leaderboard': 'https://evalplus.github.io/leaderboard.html',
        'reference': 'https://github.com/ise-uiuc/magicoder/blob/main/README.md?plain=1#L38'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mteb/leaderboard',
        'reference': 'https://github.com/qdrant/fastembed/blob/main/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://leaderboard.tabbyml.com',
        'reference': 'https://github.com/deepseek-ai/awesome-deepseek-coder/blob/main/README.md?plain=1#L49'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/merveenoyan/awesome-osml-for-devs/blob/main/README.md?plain=1#L130'
    },
    {
        'leaderboard': 'https://mixeval.github.io/#leaderboard',
        'reference': 'https://github.com/Psycoy/MixEval/blob/main/README.md?plain=1#L4'
    },
    {
        'leaderboard': 'https://github.com/BAAI-DCAI/Multimodal-Robustness-Benchmark',
        'reference': ''
    },
    {
        'leaderboard': 'https://vlue-benchmark.github.io/leaderboard.html',
        'reference': 'https://github.com/MichaelZhouwang/VLUE/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://www.nuscenes.org/object-detection',
        'reference': 'https://github.com/hht1996ok/EA-LSS/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/ZaloAI-Jaist/VMLU',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/hkust-nlp/ceval',
        'reference': 'https://github.com/NicholasCao/Awesome-Chinese-ChatGPT/blob/main/README.md?plain=1#L24'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/NicholasCao/Awesome-Chinese-ChatGPT/blob/main/README.md?plain=1#L25'
    },
    {
        'leaderboard': 'https://www.superclueai.com',
        'reference': 'https://github.com/NicholasCao/Awesome-Chinese-ChatGPT/blob/main/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/NicholasCao/Awesome-Chinese-ChatGPT/blob/main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://github.com/wangxw5/wikiDiverse',
        'reference': ''
    },
    {
        'leaderboard': 'https://csgaobb.github.io/Projects/mscoco-fsod.html',
        'reference': 'https://github.com/gaobb/Few-Shot-Object-Detection-Papers/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://csgaobb.github.io/Projects/pascalvoc-fsod.html',
        'reference': 'https://github.com/gaobb/Few-Shot-Object-Detection-Papers/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://superbbenchmark.org/leaderboard',
        'reference': 'https://github.com/sungnyun/ARMHuBERT/blob/master/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://github.com/THUDM/LongBench',
        'reference': 'https://github.com/DAMO-NLP-SG/CLEX/blob/main/README.md?plain=1#L162'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/lmsys/chatbot-arena-leaderboard',
        'reference': 'https://github.com/leobeeson/llm_benchmarks/blob/master/README.md?plain=1#L316'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/leobeeson/llm_benchmarks/blob/master/README.md?plain=1#L348'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/leobeeson/llm_benchmarks/blob/master/README.md?plain=1#L348'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/long-context-understanding-on-mmneedle',
        'reference': 'https://github.com/Wang-ML-Lab/multimodal-needle-in-a-haystack/blob/main/README.md?plain=1#L14'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/unsupervised-domain-adaptation-on-ucf-hmdb',
        'reference': 'https://github.com/ldkong1205/TranSVAE/blob/main/README.md?plain=1#L67'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/unsupervised-domain-adaptation-on-jester',
        'reference': 'https://github.com/ldkong1205/TranSVAE/blob/main/README.md?plain=1#L67'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/unsupervised-domain-adaptation-on-epic',
        'reference': 'https://github.com/ldkong1205/TranSVAE/blob/main/README.md?plain=1#L67'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/chenking2020/FindTheChatGPTer/blob/main/README.md?plain=1#L539'
    },
    {
        'leaderboard': 'https://cevalbenchmark.com/static/leaderboard.html',
        'reference': 'https://github.com/chenking2020/FindTheChatGPTer/blob/main/README.md?plain=1#L549'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/mslr-ms2',
        'reference': 'https://github.com/allenai/ms2/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://github.com/insikk/CBIR_LeaderBoard',
        'reference': 'https://github.com/keloli/CBIR_EXPLORE/blob/master/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/opstower-ai/devops-ai-open-leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.cvlibs.net/datasets/kitti',
        'reference': 'https://github.com/SeasonDepth/SeasonDepth/blob/master/README.md?plain=1#L2'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/yangjianxin1/Firefly-LLaMA2-Chinese/blob/master/README.MD?plain=1#L85'
    },
    {
        'leaderboard': 'https://github.com/haonan-li/CMMLU',
        'reference': 'https://github.com/yangjianxin1/Firefly-LLaMA2-Chinese/blob/master/README.MD?plain=1#L112'
    },
    {
        'leaderboard': 'https://open-compass.github.io/T-Eval/leaderboard.html',
        'reference': 'https://github.com/tjtanaa/awesome-large-action-model/blob/main/README.md?plain=1#L20'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/bigcode/bigcode-models-leaderboard',
        'reference': 'https://github.com/codefuse-ai/MFTCoder/blob/main/README.md?plain=1#L55'
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb.php?challengeid=11&compid=4',
        'reference': 'https://github.com/Smorodov/Deep-learning-object-detection-links./blob/master/readme.md?plain=1#L31'
    },
    {
        'leaderboard': 'https://github.com/talk2car/Talk2Car',
        'reference': ''
    },
    {
        'leaderboard': 'https://atlas-challenge.u-bourgogne.fr/leaderboard',
        'reference': 'https://github.com/uni-medical/STU-Net/blob/main/README.md?plain=1#L11'
    },
    {
        'leaderboard': 'https://sppin.grand-challenge.org/evaluation/final-test-phase/leaderboard',
        'reference': 'https://github.com/uni-medical/STU-Net/blob/main/README.md?plain=1#L12'
    },
    {
        'leaderboard': 'https://autopet-ii.grand-challenge.org/leaderboard',
        'reference': 'https://github.com/uni-medical/STU-Net/blob/main/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/12239',
        'reference': 'https://github.com/uni-medical/STU-Net/blob/main/README.md?plain=1#L14'
    },
    {
        'leaderboard': 'https://github.com/hkust-nlp/ceval',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard',
        'reference': 'https://github.com/ruanchaves/napolab/blob/main/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://github.com/Instance-Search/Instance-Search',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/LudwigStumpp/llm-leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/bigcode/bigcode-models-leaderboard',
        'reference': 'https://github.com/bigcode-project/bigcode-evaluation-harness/blob/leaderboard/leaderboard/README.md?plain=1#L11'
    },
    {
        'leaderboard': 'https://github.com/awslabs/diagnostic-robustness-text-to-sql',
        'reference': ''
    },
    {
        'leaderboard': 'https://openlamm.github.io/ch3ef/leaderboard.html',
        'reference': 'https://github.com/OpenGVLab/LAMM/blob/main/README.md?plain=1#L15'
    },
    {
        'leaderboard': 'https://visualcommonsense.com/leaderboard',
        'reference': 'https://github.com/ict-bigdatalab/awesome-pretrained-models-for-information-retrieval/blob/main/README.md?plain=1#L513'
    },
    {
        'leaderboard': 'https://stanfordmlgroup.github.io/competitions/mrnet',
        'reference': 'https://github.com/MisaOgura/MRNet/blob/master/README.md?plain=1#L278'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/GPT-Alternatives/gpt_alternatives/blob/main/README.md?plain=1#L271'
    },
    {
        'leaderboard': 'https://github.com/salesforce/localization-xml-mt',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/ldkong1205/PointCloud-C',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/AsuradaYuci/awesome_video_person_reid/blob/master/leaderboard.md',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/THUDM/ChatGLM-Math',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/LMMMEng/LLD-MMRI2023/blob/main/assets/test_leaderboard.md',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/jianguoz/Few-Shot-Intent-Detection',
        'reference': ''
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1256/leaderboard',
        'reference': 'https://github.com/neurallatents/nlb_tools/blob/main/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/music-demixing-challenge-ismir-2021/leaderboards',
        'reference': 'https://github.com/AIcrowd/music-demixing-challenge-starter-kit/blob/master/README.md?plain=1#L194'
    },
    {
        'leaderboard': 'https://yale-lily.github.io/spider',
        'reference': 'https://github.com/taoyds/spider/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://www.nist.gov/programs-projects/face-technology-evaluations-frtefate',
        'reference': 'https://github.com/becauseofAI/awesome-face/blob/master/README.md?plain=1#L465'
    },
    {
        'leaderboard': 'https://comma.ai/leaderboard',
        'reference': 'https://github.com/commaai/controls_challenge/blob/master/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/sherlock',
        'reference': 'https://github.com/allenai/sherlock/blob/main/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://github.com/michuanhaohao/AICITY2021_Track2_DMT',
        'reference': ''
    },
    {
        'leaderboard': 'https://opendrivelab.com/challenge2023',
        'reference': 'https://github.com/er-muyue/BeMapNet/blob/main/README.md?plain=1#L11'
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk/leaderboard/displaylb.php?challengeid=11',
        'reference': 'https://github.com/openaifab/hair/blob/master/README.md?plain=1#L62'
    },
    {
        'leaderboard': 'https://paperswithcode.com/task/image-super-resolution',
        'reference': 'https://github.com/isaaccorley/pytorch-enhance/blob/master/README.md?plain=1#L55'
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb.php?challengeid=11&compid=6',
        'reference': 'https://github.com/autonomousdrivingkr/Awesome-Autonomous-Driving/blob/master/README.md?plain=1#L143'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/instructkr/ko-chatbot-arena-leaderboard',
        'reference': 'https://github.com/HeegyuKim/open-korean-instructions/blob/main/README.md?plain=1#L73'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/instructkr/LogicKor-leaderboard',
        'reference': 'https://github.com/HeegyuKim/open-korean-instructions/blob/main/README.md?plain=1#L74'
    },
    {
        'leaderboard': 'https://lil.nlp.cornell.edu/nlvr',
        'reference': 'https://github.com/lil-lab/nlvr/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://github.com/cardiffnlp/tweeteval',
        'reference': ''
    },
    {
        'leaderboard': 'https://nealcly.github.io/MuTual-leaderboard',
        'reference': 'https://github.com/Nealcly/MuTual/blob/master/README.md?plain=1#L65'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/imaterialist-challenge-furniture-2018/leaderboard',
        'reference': 'https://github.com/skrypka/imaterialist-furniture-2018/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://www.nuscenes.org/tracking',
        'reference': 'https://github.com/dvlab-research/VoxelNeXt/blob/master/README.md?plain=1#L21'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/instance-segmentation-on-coco-minival',
        'reference': 'https://github.com/IDEA-Research/DN-DETR/blob/main/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/panoptic-segmentation-on-coco-minival',
        'reference': 'https://github.com/IDEA-Research/DN-DETR/blob/main/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/semantic-segmentation-on-ade20k',
        'reference': 'https://github.com/IDEA-Research/DN-DETR/blob/main/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://few-shot.yyliu.net/miniimagenet.html',
        'reference': 'https://github.com/icoz69/DeepEMD/blob/master/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://insightface.ai/mfr21',
        'reference': 'https://github.com/deepinsight/insightface/blob/master/README.md?plain=1#L70'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/12599',
        'reference': 'https://github.com/dongkyunk/CheXFusion/blob/main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://github.com/openai/gym/wiki/Leaderboard',
        'reference': 'https://github.com/dgriff777/rl_a3c_pytorch/blob/master/README.MD?plain=1#L22'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/semi-supervised-semantic-segmentation-on-25',
        'reference': 'https://github.com/ldkong1205/LaserMix/blob/main/README.md?plain=1#L73'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/semi-supervised-semantic-segmentation-on-24',
        'reference': 'https://github.com/ldkong1205/LaserMix/blob/main/README.md?plain=1#L73'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/semi-supervised-semantic-segmentation-on-23',
        'reference': 'https://github.com/ldkong1205/LaserMix/blob/main/README.md?plain=1#L73'
    },
    {
        'leaderboard': 'https://paperswithcode.com/paper/lasermix-for-semi-supervised-lidar-semantic',
        'reference': 'https://github.com/ldkong1205/LaserMix/blob/main/README.md?plain=1#L73'
    },
    {
        'leaderboard': 'https://github.com/Coder-Yu/SELFRec',
        'reference': ''
    },
    {
        'leaderboard': 'https://arctic-leaderboard.is.tuebingen.mpg.de/leaderboard',
        'reference': 'https://github.com/zc-alexfan/arctic/blob/master/README.md?plain=1#L44'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/text-to-sql-on-kaggledbqa',
        'reference': 'https://github.com/Chia-Hsuan-Lee/KaggleDBQA/blob/main/README.md?plain=1#L4'
    },
    {
        'leaderboard': 'http://ccl.pku.edu.cn:8084/SpaCE2021/rank',
        'reference': 'https://github.com/2030NLP/SpaCE2021/blob/main/README.md?plain=1#L98'
    },
    {
        'leaderboard': 'http://ccl.pku.edu.cn:8084/SpaCE2021/rank',
        'reference': 'https://github.com/z-fabian/HUMUS-Net/blob/master/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://github.com/MinghuiChen43/CIL-ReID',
        'reference': ''
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/yuchenlin/LLM-Blender/blob/main/README.md?plain=1#L346'
    },
    {
        'leaderboard': 'https://github.com/pddasig/Machine-Learning-Competition-2020',
        'reference': ''
    },
    {
        'leaderboard': 'https://yale-lily.github.io/spider',
        'reference': 'https://github.com/BeachWang/DAIL-SQL/blob/main/README.md?plain=1#L4'
    },
    {
        'leaderboard': 'http://got-10k.aitestunion.com/leaderboard',
        'reference': 'https://github.com/wangdongdut/Online-Visual-Tracking-SOTA/blob/master/README.md?plain=1#L116'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/Pan-ML/panml/blob/main/README.md?plain=1#L25'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/Slep/LRVSF-Leaderboard',
        'reference': 'https://github.com/Simon-Lepage/CondViT-LRVSF/blob/main/README.md?plain=1#L28'
    },
    {
        'leaderboard': 'https://mmbench.opencompass.org.cn/leaderboard',
        'reference': 'https://github.com/open-compass/MMBench/blob/main/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://github.com/THUDM/VisualAgentBench',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/nyu-cv-fall-2018/leaderboard',
        'reference': 'https://github.com/poojahira/gtsrb-pytorch/blob/master/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://github.com/lupantech/PromptPG',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/vidore/vidore-leaderboard',
        'reference': 'https://github.com/illuin-tech/vidore-benchmark/blob/main/README.md?plain=1#L14'
    },
    {
        'leaderboard': 'https://www.kaggle.com/competitions/mlsp-2013-birds/leaderboard',
        'reference': 'https://github.com/gaborfodor/MLSP_2013/blob/master/readme.md?plain=1#L42'
    },
    {
        'leaderboard': 'https://github.com/shjung13/Standardized-max-logits',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/k2-fsa/libriheavy',
        'reference': ''
    },
    {
        'leaderboard': 'http://got-10k.aitestunion.com/leaderboard',
        'reference': 'https://github.com/huanglianghua/siamrpn-pytorch/blob/master/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://github.com/Xtra-Computing/NIID-Bench',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/brohrer/parameter_efficiency_leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1247/leaderboard',
        'reference': 'https://github.com/SoonminHwang/rgbt-ped-detection/blob/master/README.md?plain=1#L4'
    },
    {
        'leaderboard': 'https://visualcommonsense.com/leaderboard',
        'reference': 'https://github.com/zhegan27/VILLA/blob/main/README.md?plain=1#L130'
    },
    {
        'leaderboard': 'https://microsoft.github.io/AirSim-NeurIPS2019-Drone-Racing/leaderboard_final.html',
        'reference': 'https://github.com/microsoft/AirSim-NeurIPS2019-Drone-Racing/blob/master/README.md?plain=1#L206'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/BestWishYsh/ChronoMagic-Bench',
        'reference': 'https://github.com/yhZhai/mcm/blob/main/README.md?plain=1#L19'
    },
    {
        'leaderboard': 'https://github.com/hemingkx/Spec-Bench/blob/main/Leaderboard.md',
        'reference': ''
    },
    {
        'leaderboard': 'https://open-xai.github.io/leaderboard',
        'reference': 'https://github.com/AI4LIFE-GROUP/OpenXAI/blob/main/README.md?plain=1#L20'
    },
    {
        'leaderboard': 'https://rank.opencompass.org.cn/leaderboard-llm',
        'reference': 'https://github.com/TommyZihao/ChatMarx/blob/main/README.md?plain=1#L129'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/454/leaderboard',
        'reference': 'https://github.com/ZikangZhou/QCNet/blob/main/README.md?plain=1#L9'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1719/leaderboard',
        'reference': 'https://github.com/ZikangZhou/QCNet/blob/main/README.md?plain=1#L10'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/change-point-detection-on-tep',
        'reference': 'https://github.com/YKatser/CPDE/blob/master/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/change-point-detection-on-skab',
        'reference': 'https://github.com/YKatser/CPDE/blob/master/README.md?plain=1#L22'
    },
    {
        'leaderboard': 'https://github.com/ai-forever/digital_peter_aij2020',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/echo840/ocrbench-leaderboard',
        'reference': 'https://github.com/Yuliang-Liu/MultimodalOCR/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://leaderboard.sea-lion.ai',
        'reference': 'https://github.com/aisingapore/sealion/blob/main/README.md?plain=1#L81'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/image-harmonization-on-iharmony4',
        'reference': 'https://github.com/bcmi/Awesome-Image-Harmonization/blob/master/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://challenge.isic-archive.com/landing/2018',
        'reference': 'https://github.com/ngessert/isic2018/blob/master/README.md?plain=1#L4'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/chujiezheng/LLM-Extrapolation/blob/main/README.md?plain=1#L78'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/chujiezheng/LLM-Extrapolation/blob/main/README.md?plain=1#L80'
    },
    {
        'leaderboard': 'https://aider.chat/docs/leaderboards',
        'reference': 'https://github.com/chujiezheng/LLM-Extrapolation/blob/main/README.md?plain=1#L80'
    },
    {
        'leaderboard': 'https://opening-up-chatgpt.github.io',
        'reference': 'https://github.com/opening-up-chatgpt/opening-up-chatgpt.github.io/blob/main/readme.md?plain=1#L1'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/visualcomet',
        'reference': 'https://github.com/jamespark3922/visual-comet/blob/master/README.md?plain=1#L153'
    },
    {
        'leaderboard': 'https://github.com/StarStyleSky/awesome-face-detection',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/junqiangchen/LiTS---Liver-Tumor-Segmentation-Challenge',
        'reference': ''
    },
    {
        'leaderboard': 'https://tgb.complexdatalab.com/docs/leader_linkprop',
        'reference': 'https://github.com/shenyangHuang/TGB/blob/main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://github.com/vztu/BVQA_Benchmark',
        'reference': ''
    },
    {
        'leaderboard': 'https://rrc.cvc.uab.es',
        'reference': 'https://github.com/EriCongMa/awesome-transformer-ocr/blob/main/README.md?plain=1#L229'
    },
    {
        'leaderboard': 'https://gluebenchmark.com/leaderboard',
        'reference': 'https://github.com/yurakuratov/t5-experiments/blob/main/README.md?plain=1#L263'
    },
    {
        'leaderboard': 'https://github.com/open-compass/BotChat',
        'reference': ''
    },
    {
        'leaderboard': 'https://trustllmbenchmark.github.io/TrustLLM-Website/leaderboard.html',
        'reference': 'https://github.com/jphall663/awesome-machine-learning-interpretability/blob/master/README.md?plain=1#L1158'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/music-demixing-challenge-ismir-2021/leaderboards',
        'reference': 'https://github.com/yoyololicon/music-demixing-challenge-ismir-2021-entry/blob/master/README.md?plain=1#L1'
    },
    {
        'leaderboard': 'https://www.cvlibs.net/datasets/kitti/eval_object.php?obj_benchmark=3d',
        'reference': 'https://github.com/mileyan/pseudo_lidar/blob/master/README.md?plain=1#L32'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/a-okvqa',
        'reference': 'https://github.com/allenai/aokvqa/blob/main/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/seismic-facies-identification-challenge/leaderboards',
        'reference': 'https://github.com/AIcrowd/seismic-facies-identification-starter-kit/blob/master/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://github.com/haoweiz23/Awesome-Fine-grained-Visual-Classification',
        'reference': ''
    },
    {
        'leaderboard': 'https://hfl-rc.github.io/cmrc2017/leaderboard',
        'reference': 'https://github.com/ymcui/Chinese-RC-Datasets/blob/master/README.md?plain=1#L63'
    },
    {
        'leaderboard': 'https://aistudio.baidu.com/competition/detail/720/0/leaderboard',
        'reference': 'https://github.com/ymcui/Chinese-RC-Datasets/blob/master/README.md?plain=1#L84'
    },
    {
        'leaderboard': 'https://hfl-rc.github.io/cmrc2018/open_challenge',
        'reference': 'https://github.com/ymcui/Chinese-RC-Datasets/blob/master/README.md?plain=1#L100'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/landmark-recognition-2020/leaderboard',
        'reference': 'https://github.com/bestfitting/instance_level_recognition/blob/main/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/baichuan-inc/Baichuan-7B/blob/main/README.md?plain=1#L128'
    },
    {
        'leaderboard': 'https://github.com/google-research-datasets/seahorse',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/netease-youdao/BCEmbedding',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/yxgeee/MMT-plus',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/infinigence/LVEval',
        'reference': ''
    },
    {
        'leaderboard': 'https://stanfordnlp.github.io/coqa',
        'reference': 'https://github.com/stevezheng23/xlnet_extension_tf/blob/master/README.md?plain=1#L2'
    },
    {
        'leaderboard': 'https://quac.ai',
        'reference': 'https://github.com/stevezheng23/xlnet_extension_tf/blob/master/README.md?plain=1#L4'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mteb/leaderboard',
        'reference': 'https://github.com/CoIR-team/coir/blob/main/README.md?plain=1#L24'
    },
    {
        'leaderboard': 'https://archersama.github.io/coir',
        'reference': 'https://github.com/CoIR-team/coir/blob/main/README.md?plain=1#L24'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/Xwin-LM/Xwin-LM/blob/main/README.md?plain=1#L83'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/food-recognition-benchmark-2022/leaderboards',
        'reference': 'https://github.com/AIcrowd/food-recognition-benchmark-starter-kit/blob/master/README.md?plain=1#L193'
    },
    {
        'leaderboard': 'https://leaderboard.carla.org/leaderboard',
        'reference': 'https://github.com/carla-simulator/scenario_runner/blob/master/README.md?plain=1#L49'
    },
    {
        'leaderboard': 'https://rajpurkar.github.io/SQuAD-explorer',
        'reference': 'https://github.com/Nagakiran1/Extending-Google-BERT-as-Question-and-Answering-model-and-Chatbot/blob/master/README.md?plain=1#L422'
    },
    {
        'leaderboard': 'https://github.com/yanyanSann/Long-Tailed-Classification-Leaderboard',
        'reference': 'https://github.com/Keke921/GCLLoss/blob/main/README.md?plain=1#L65'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/yongzhuo/qwen2-sft/blob/master/README.md?plain=1#L106'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/103/leaderboard',
        'reference': 'https://github.com/batra-mlp-lab/visdial/blob/master/README.md?plain=1#L293'
    },
    {
        'leaderboard': 'https://github.com/FormulaMonks/llm-benchmarker-suite',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/inspire-group/patch-defense-leaderboard',
        'reference': 'https://github.com/inspire-group/PatchGuard/blob/master/README.md?plain=1#L9'
    },
    {
        'leaderboard': 'https://github.com/open-mmlab/OpenUnReID/blob/master/docs/LEADERBOARD.md',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/declare-lab/instruct-eval',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/VITA-Group/Deep_GCN_Benchmarking',
        'reference': ''
    },
    {
        'leaderboard': 'https://dki-lab.github.io/GrailQA',
        'reference': 'https://github.com/microsoft/vert-papers/blob/master/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/Aligner2024/aligner/blob/master/README.md?plain=1#L9'
    },
    {
        'leaderboard': 'https://mathverse-cuhk.github.io/#leaderboard',
        'reference': 'https://github.com/ZrrSkywalker/MAVIS/blob/main/README.md?plain=1#L10'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/244/leaderboard',
        'reference': 'https://github.com/xinke-wang/Awesome-Text-VQA/blob/master/README.md?plain=1#L108'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/551/leaderboard',
        'reference': 'https://github.com/xinke-wang/Awesome-Text-VQA/blob/master/README.md?plain=1#L109'
    },
    {
        'leaderboard': 'https://rrc.cvc.uab.es/?ch=11&com=evaluation&task=1',
        'reference': 'https://github.com/xinke-wang/Awesome-Text-VQA/blob/master/README.md?plain=1#L129'
    },
    {
        'leaderboard': 'https://paperswithcode.com/dataset/popgym',
        'reference': 'https://github.com/proroklab/popgym/blob/master/README.md?plain=1#L76'
    },
    {
        'leaderboard': 'https://taolusi.github.io/CSpider-explorer',
        'reference': 'https://github.com/taolusi/chisp/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/mlabonne/llm-autoeval/blob/master/README.md?plain=1#L40'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mlabonne/Yet_Another_LLM_Leaderboard',
        'reference': 'https://github.com/mlabonne/llm-autoeval/blob/master/README.md?plain=1#L67'
    },
    {
        'leaderboard': 'https://gluebenchmark.com/leaderboard',
        'reference': 'https://github.com/charles9n/bert-sklearn/blob/master/README.md?plain=1#L105'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/MIBlue119/awesome-llama-resources/blob/main/README.md?plain=1#L106'
    },
    {
        'leaderboard': 'https://ml.energy/leaderboard',
        'reference': 'https://github.com/AmberLJC/LLMSys-PaperList/blob/main/README.md?plain=1#L158'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/optimum/llm-perf-leaderboard',
        'reference': 'https://github.com/AmberLJC/LLMSys-PaperList/blob/main/README.md?plain=1#L159'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/AmberLJC/LLMSys-PaperList/blob/main/README.md?plain=1#L161'
    },
    {
        'leaderboard': 'https://crfm.stanford.edu/helm',
        'reference': 'https://github.com/AmberLJC/LLMSys-PaperList/blob/main/README.md?plain=1#L162'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/AmberLJC/LLMSys-PaperList/blob/main/README.md?plain=1#L163'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/openlifescienceai/open_medical_llm_leaderboard',
        'reference': 'https://github.com/AI-in-Health/MedLLMsPracticalGuide/blob/main/README.md?plain=1#L269'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/ymcui/Chinese-LLaMA-Alpaca-3/blob/main/README.md?plain=1#L240'
    },
    {
        'leaderboard': 'https://github.com/RPC-Dataset/RPC-Leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/alibaba/AICITY2024_Track2_AliOpenTrek_CityLLaVA',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/THUDM/SciGLM',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.hilti-challenge.com',
        'reference': 'https://github.com/Hilti-Research/hilti-slam-challenge-2021/blob/master/README.md?plain=1#L18'
    },
    {
        'leaderboard': 'https://github.com/thu-coai/Safety-Prompts',
        'reference': ''
    },
    {
        'leaderboard': 'https://opendrivelab.com/challenge2023',
        'reference': 'https://github.com/wenjie710/PivotNet/blob/main/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://www.crowdbenchmark.com/nwpucrowdloc.html',
        'reference': 'https://github.com/taohan10200/Awesome-Crowd-Localization/blob/main/README.md?plain=1#L88'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/17672',
        'reference': 'https://github.com/cage-challenge/cage-challenge-4/blob/main/README.md?plain=1#L187'
    },
    {
        'leaderboard': 'https://leaderboard.carla.org/leaderboard',
        'reference': 'https://github.com/erdos-project/pylot/blob/master/README.md?plain=1#L266'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/NexaAIDev/domain_llm_leaderboard',
        'reference': 'https://github.com/NexaAI/octopus-v4/blob/main/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://github.com/shikras/d-cube/tree/main/eval_sota',
        'reference': 'https://github.com/Charles-Xie/awesome-described-object-detection/blob/main/README.md?plain=1#L42'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/opencompass/open_vlm_leaderboard',
        'reference': 'https://github.com/scenarios/WeMM/blob/main/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://opencompass.org.cn/leaderboard-multimodal',
        'reference': 'https://github.com/scenarios/WeMM/blob/main/README.md?plain=1#L15'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/THUDM/LongAlign/blob/main/README.md?plain=1#L106'
    },
    {
        'leaderboard': 'https://github.com/GAIR-NLP/OpenResearcher',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/lmsys/chatbot-arena-leaderboard',
        'reference': 'https://github.com/Hannibal046/Awesome-LLM/blob/main/README.md?plain=1#L132'
    },
    {
        'leaderboard': 'https://mixeval.github.io/#leaderboard',
        'reference': 'https://github.com/Hannibal046/Awesome-LLM/blob/main/README.md?plain=1#L133'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/Hannibal046/Awesome-LLM/blob/main/README.md?plain=1#L134'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/Hannibal046/Awesome-LLM/blob/main/README.md?plain=1#L136'
    },
    {
        'leaderboard': 'https://rank.opencompass.org.cn/leaderboard-llm',
        'reference': 'https://github.com/Hannibal046/Awesome-LLM/blob/main/README.md?plain=1#L137'
    },
    {
        'leaderboard': 'https://gorilla.cs.berkeley.edu/leaderboard.html',
        'reference': 'https://github.com/Hannibal046/Awesome-LLM/blob/main/README.md?plain=1#L138'
    },
    {
        'leaderboard': 'https://github.com/svilupp/Julia-LLM-Leaderboard',
        'reference': 'https://github.com/svilupp/awesome-generative-ai-meets-julia-language/blob/main/README.md?plain=1#L95'
    },
    {
        'leaderboard': 'https://github.com/ethz-spylab/rlhf_trojan_competition',
        'reference': ''
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/463/leaderboard',
        'reference': 'https://github.com/zd11024/NaviLLM/blob/main/README.md?plain=1#L80'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1715/leaderboard',
        'reference': 'https://github.com/zd11024/NaviLLM/blob/main/README.md?plain=1#L80'
    },
    {
        'leaderboard': 'https://github.com/bcmi/Image-Harmonization-Dataset-iHarmony4',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.nuscenes.org/object-detection',
        'reference': 'https://github.com/nv-tlabs/planning-centric-metrics/blob/master/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/global-wheat-detection/leaderboard',
        'reference': 'https://github.com/liaopeiyuan/TransferDet/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://github.com/adobe-research/deft_corpus',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/yongzhuo/LLM-SFT/blob/main/README.md?plain=1#L71'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/CLUEbenchmark/SuperCLUE-Llama2-Chinese/blob/main/README.md?plain=1#L120'
    },
    {
        'leaderboard': 'https://lv-mhp.github.io/human_parsing_lb',
        'reference': 'https://github.com/ZhaoJ9014/Multi-Human-Parsing/blob/master/README.md?plain=1#L71'
    },
    {
        'leaderboard': 'https://bop.felk.cvut.cz/leaderboards/pose-estimation-unseen-bop23/core-datasets',
        'reference': 'https://github.com/NVlabs/FoundationPose/blob/main/readme.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/seizure-prediction/leaderboard',
        'reference': 'https://github.com/april-org/april-ann/blob/master/README.md?plain=1#L299'
    },
    {
        'leaderboard': 'https://github.com/romainloiseau/HelixNet',
        'reference': ''
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-object-tracking-on-lasot',
        'reference': 'https://github.com/Little-Podi/AiATrack/blob/main/README.md?plain=1#L25'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-object-tracking-on-trackingnet',
        'reference': 'https://github.com/Little-Podi/AiATrack/blob/main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-object-tracking-on-got-10k',
        'reference': 'https://github.com/Little-Podi/AiATrack/blob/main/README.md?plain=1#L28'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-object-tracking-on-needforspeed',
        'reference': 'https://github.com/Little-Podi/AiATrack/blob/main/README.md?plain=1#L29'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-object-tracking-on-otb-100',
        'reference': 'https://github.com/Little-Podi/AiATrack/blob/main/README.md?plain=1#L30'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-object-tracking-on-uav123',
        'reference': 'https://github.com/Little-Podi/AiATrack/blob/main/README.md?plain=1#L31'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L112'
    },
    {
        'leaderboard': 'https://microsoft.github.io/GLUECoS',
        'reference': ''
    },
    {
        'leaderboard': 'https://hkust-nlp.github.io/agentboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L174'
    },
    {
        'leaderboard': 'https://artificialanalysis.ai/text-to-image',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L176'
    },
    {
        'leaderboard': 'https://scale.com/leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L177'
    },
    {
        'leaderboard': 'https://crfm.stanford.edu/helm',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L178'
    },
    {
        'leaderboard': 'https://www.vals.ai',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L179'
    },
    {
        'leaderboard': 'https://trustllmbenchmark.github.io/TrustLLM-Website/leaderboard.html',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L180'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L181'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L182'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/optimum/llm-perf-leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L183'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/hallucinations-leaderboard/leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L184'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/NPHardEval/NPHardEval-leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L185'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/AI-Secure/llm-trustworthy-leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L186'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/openlifescienceai/open_medical_llm_leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L187'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/gaia-benchmark/leaderboard',
        'reference': 'https://github.com/PetroIvaniuk/llms-tools/blob/main/README.md?plain=1#L189'
    },
    {
        'leaderboard': 'https://superbbenchmark.org/leaderboard',
        'reference': 'https://github.com/mechanicalsea/lighthubert/blob/main/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://github.com/PengYu-Team/Co-LRIO',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/dvlab-research/DSGN',
        'reference': ''
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/3d-lane-detection-on-openlane',
        'reference': 'https://github.com/OpenDriveLab/OpenLane/blob/main/README.md?plain=1#L24'
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/shure-dev/Awesome-LLM-Papers-Comprehensive-Topics/blob/main/README.md?plain=1#L239'
    },
    {
        'leaderboard': 'https://github.com/LudwigStumpp/llm-leaderboard',
        'reference': 'https://github.com/shure-dev/Awesome-LLM-Papers-Comprehensive-Topics/blob/main/README.md?plain=1#L413'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/Abdullahw72/langchain-chatbot-multiple-PDF/blob/master/README.md?plain=1#L56'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/propara',
        'reference': 'https://github.com/allenai/propara/blob/master/README.md?plain=1#L12'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/scifact',
        'reference': 'https://github.com/allenai/scifact/blob/master/README.md?plain=1#L33'
    },
    {
        'leaderboard': 'https://hkust-nlp.github.io/agentboard',
        'reference': 'https://github.com/hkust-nlp/AgentBoard/blob/main/README.md?plain=1#L18'
    },
    {
        'leaderboard': 'https://adeval.cstcloud.cn/content/leaderboard',
        'reference': 'https://github.com/dawnvince/EasyTSAD/blob/main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/GeneZC/MiniMA/blob/main/README.md?plain=1#L58'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/GeneZC/MiniMA/blob/main/README.md?plain=1#L62'
    },
    {
        'leaderboard': 'https://github.com/deepchem/moleculenet',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/CLUEbenchmark/CLUE',
        'reference': ''
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/454/leaderboard',
        'reference': 'https://github.com/Henry1iu/TNT-Trajectory-Prediction/blob/main/README.md?plain=1#L25'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/thestriver/ai-for-javascript-course/blob/main/README.md?plain=1#L411'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/thestriver/ai-for-javascript-course/blob/main/README.md?plain=1#L413'
    },
    {
        'leaderboard': 'https://www.cvlibs.net/datasets/kitti/eval_scene_flow.php',
        'reference': 'https://github.com/jiahaopang/crl/blob/master/README.md?plain=1#L28'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/visual-entailment-on-snli-ve-val',
        'reference': 'https://github.com/necla-ml/SNLI-VE/blob/master/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1938/leaderboard',
        'reference': 'https://github.com/buildingnet/buildingnet_dataset/blob/main/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1663/leaderboard',
        'reference': 'https://github.com/alexa/alexa-with-dstc9-track1-dataset/blob/master/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mteb/leaderboard',
        'reference': 'https://github.com/skeskinen/llama-lite/blob/master/README.md?plain=1#L67'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/optimum/llm-perf-leaderboard',
        'reference': 'https://github.com/samuelrince/awesome-green-ai/blob/main/README.md?plain=1#L87'
    },
    {
        'leaderboard': 'https://ml.energy/leaderboard',
        'reference': 'https://github.com/samuelrince/awesome-green-ai/blob/main/README.md?plain=1#L88'
    },
    {
        'leaderboard': 'https://sites.google.com/view/pgdl2020/leaderboard',
        'reference': 'https://github.com/parthnatekar/pgdl/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://sites.google.com/view/pgdl2020/leaderboard',
        'reference': 'https://github.com/z-x-yang/AOT/blob/main/README.md?plain=1#L29'
    },
    {
        'leaderboard': 'https://github.com/ws-choi/Conditioned-Source-Separation-LaSAFT',
        'reference': ''
    },
    {
        'leaderboard': 'https://eu.aihub.ml/competitions/201',
        'reference': 'https://github.com/z-x-yang/AOT/blob/main/README.md?plain=1#L29'
    },
    {
        'leaderboard': 'https://eu.aihub.ml/competitions/201',
        'reference': 'https://github.com/z-x-yang/AOT/blob/main/README.md?plain=1#L31'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/606/leaderboard',
        'reference': 'https://github.com/YuankaiQi/REVERIE/blob/master/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/2049/leaderboard',
        'reference': 'https://github.com/eric-ai-lab/Aerial-Vision-and-Dialog-Navigation/blob/origin/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://github.com/robot-pesg/BotanicGarden/tree/main/leaderboard',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.cvlibs.net/datasets/kitti/eval_object.php?obj_benchmark=3d',
        'reference': 'https://github.com/sshaoshuai/PointRCNN/blob/master/README.md?plain=1#L18'
    },
    {
        'leaderboard': 'https://rrc.cvc.uab.es/?ch=17&com=evaluation&task=4',
        'reference': 'https://github.com/rubenpt91/MP-DocVQA-Framework/blob/master/readme.md?plain=1#L39'
    },
    {
        'leaderboard': 'https://rajpurkar.github.io/SQuAD-explorer',
        'reference': 'https://github.com/allenai/document-qa/blob/master/README.md?plain=1#L167'
    },
    {
        'leaderboard': 'https://github.com/pangeo-data/WeatherBench',
        'reference': ''
    },
    {
        'leaderboard': 'https://cares-ai.github.io/#leaderboard',
        'reference': 'https://github.com/richard-peng-xia/CARES/blob/main/README.md?plain=1#L12'
    },
    {
        'leaderboard': 'https://github.com/GAIR-NLP/benbench',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/eduagarcia/open_pt_llm_leaderboard',
        'reference': 'https://github.com/ajdavidl/Portuguese-NLP/blob/main/README.md?plain=1#L237'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/97/leaderboard',
        'reference': 'https://github.com/peteanderson80/Matterport3DSimulator/blob/master/README.md?plain=1#L50'
    },
    {
        'leaderboard': 'https://github.com/Master-PLC/FreDF',
        'reference': ''
    },
    {
        'leaderboard': 'https://lmarena.ai',
        'reference': 'https://github.com/eugeneyan/open-llms/blob/main/README.md?plain=1#L109'
    },
    {
        'leaderboard': 'https://twitter.com/jefrankle/status/1654631746506301441',
        'reference': 'https://github.com/eugeneyan/open-llms/blob/main/README.md?plain=1#L110'
    },
    {
        'leaderboard': 'https://crfm.stanford.edu/helm',
        'reference': 'https://github.com/eugeneyan/open-llms/blob/main/README.md?plain=1#L111'
    },
    {
        'leaderboard': 'https://github.com/LudwigStumpp/llm-leaderboard',
        'reference': 'https://github.com/eugeneyan/open-llms/blob/main/README.md?plain=1#L112'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/eugeneyan/open-llms/blob/main/README.md?plain=1#L114'
    },
    {
        'leaderboard': 'https://github.com/lfy79001/TableQAKit',
        'reference': ''
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/open_book_qa',
        'reference': 'https://github.com/allenai/OpenBookQA/blob/main/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'http://www.cvlibs.net/datasets/kitti/eval_tracking.php',
        'reference': 'https://github.com/aleksandrkim61/EagerMOT/blob/open_main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://www.nuscenes.org/tracking',
        'reference': 'https://github.com/aleksandrkim61/EagerMOT/blob/open_main/README.md?plain=1#L28'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/thunlp/UltraChat/blob/main/README.md?plain=1#L35'
    },
    {
        'leaderboard': 'https://github.com/jiachens/ModelNet40-C',
        'reference': ''
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mteb/leaderboard',
        'reference': 'https://github.com/Anush008/fastembed-go/blob/main/README.md?plain=1#L18'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/830/leaderboard',
        'reference': 'https://github.com/microsoft/unilm/blob/master/README.md?plain=1#L139'
    },
    {
        'leaderboard': 'https://superbbenchmark.org/leaderboard',
        'reference': 'https://github.com/microsoft/unilm/blob/master/README.md?plain=1#L143'
    },
    {
        'leaderboard': 'https://sites.research.google/xtreme',
        'reference': 'https://github.com/microsoft/unilm/blob/master/README.md?plain=1#L146'
    },
    {
        'leaderboard': 'https://rrc.cvc.uab.es/?ch=17&com=evaluation&task=1',
        'reference': 'https://github.com/microsoft/unilm/blob/master/README.md?plain=1#L158'
    },
    {
        'leaderboard': 'https://rrc.cvc.uab.es/?ch=13&com=evaluation&task=3',
        'reference': 'https://github.com/microsoft/unilm/blob/master/README.md?plain=1#L158'
    },
    {
        'leaderboard': 'https://rajpurkar.github.io/SQuAD-explorer',
        'reference': 'https://github.com/duyunshu/bert-sentiment-analysis/blob/master/README.md?plain=1#L158'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/code-generation-on-humaneval',
        'reference': 'https://github.com/alekst23/simple-coder/blob/main/README.md?plain=1#L15'
    },
    {
        'leaderboard': 'https://hotpotqa.github.io',
        'reference': 'https://github.com/woshiyyya/DFGN-pytorch/blob/master/readme.md?plain=1#L15'
    },
    {
        'leaderboard': 'https://tatsu-lab.github.io/alpaca_eval',
        'reference': 'https://github.com/eugeneyan/llm-paper-notes/blob/main/README.md?plain=1#L94'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/smartyfh/LLM-Uncertainty-Bench/blob/main/README.md?plain=1#L24'
    },
    {
        'leaderboard': 'https://www.swebench.com',
        'reference': 'https://github.com/aorwall/moatless-tools/blob/main/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/HqWu-HITCS/Awesome-Chinese-LLM/blob/main/README.md?plain=1#L1067'
    },
    {
        'leaderboard': 'https://lvbench.github.io/#leaderboard',
        'reference': 'https://github.com/THUDM/LVBench/blob/main/README.md?plain=1#L11'
    },
    {
        'leaderboard': 'https://github.com/cbvrp-acmmm-2019/cbvrp-acmmm-2019',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/jigsaw-unintended-bias-in-toxicity-classification/leaderboard',
        'reference': 'https://github.com/thuwyh/Jigsaw-Unintended-Bias-in-Toxicity-Classification/blob/master/README.md?plain=1#L2'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/openlifescienceai/open_medical_llm_leaderboard',
        'reference': 'https://github.com/TsinghuaC3I/UltraMedical/blob/main/README.md?plain=1#L129'
    },
    {
        'leaderboard': 'https://leaderboard.carla.org/leaderboard',
        'reference': 'https://github.com/autonomousvision/carla_garage/blob/main/README.md?plain=1#L176'
    },
    {
        'leaderboard': 'https://github.com/yuh-zha/AlignScore',
        'reference': ''
    },
    {
        'leaderboard': 'https://cocodataset.org/#captions-leaderboard',
        'reference': 'https://github.com/peteanderson80/Up-Down-Captioner/blob/master/README.md?plain=1#L3'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mike-ravkine/can-ai-code-results',
        'reference': 'https://github.com/the-crypt-keeper/can-ai-code/blob/main/README.md?plain=1#L37'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/allenai/WildBench',
        'reference': 'https://github.com/allenai/WildBench/blob/main/README.md?plain=1#L8'
    },
    {
        'leaderboard': 'https://paperswithcode.com/task/node-classification-on-non-homophilic',
        'reference': 'https://github.com/SitaoLuan/ACM-GNN/blob/main/README.md?plain=1#L129'
    },
    {
        'leaderboard': 'https://waymo.com/open/challenges/2020/3d-detection',
        'reference': 'https://github.com/PJLab-ADG/LoGoNet/blob/main/README.md?plain=1#L14'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/3d-depth-estimation-on-relative-human',
        'reference': 'https://github.com/Arthur151/Relative_Human/blob/master/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/mteb/leaderboard',
        'reference': 'https://github.com/infrawhispers/anansi/blob/main/README.md?plain=1#L30'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/google-quest-challenge/leaderboard',
        'reference': 'https://github.com/oleg-yaroshevskiy/quest_qa_labeling/blob/master/README.md?plain=1#L109'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/jincheng9/gpt-tutorial/blob/main/README.md?plain=1#L114'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/unity-obstacle-tower-challenge/leaderboards',
        'reference': 'https://github.com/Unity-Technologies/obstacle-tower-source/blob/master/README.md?plain=1#L40'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/neurips-2021-minerl-diamond-competition/leaderboards',
        'reference': 'https://github.com/minerllabs/competition_submission_template/blob/master/README.md?plain=1#L14'
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb_dt.php?challengeid=6&compid=4',
        'reference': 'https://github.com/rbgirshick/rcnn/blob/master/README.md?plain=1#L39'
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb_dt.php?challengeid=11&compid=4',
        'reference': 'https://github.com/rbgirshick/rcnn/blob/master/README.md?plain=1#L40'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/robothor_objectnav',
        'reference': 'https://github.com/allenai/robothor-challenge/blob/main/README.md?plain=1#L105'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/math-word-problem-solving-on-svamp',
        'reference': 'https://github.com/chuanyang-Zheng/Progressive-Hint/blob/main/README.md?plain=1#L32'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/arithmetic-reasoning-on-gsm8k',
        'reference': 'https://github.com/chuanyang-Zheng/Progressive-Hint/blob/main/README.md?plain=1#L32'
    },
    {
        'leaderboard': 'https://paperswithcode.com/sota/math-word-problem-solving-on-math',
        'reference': 'https://github.com/chuanyang-Zheng/Progressive-Hint/blob/main/README.md?plain=1#L32'
    },
    {
        'leaderboard': 'https://mmbench.opencompass.org.cn/leaderboard',
        'reference': 'https://github.com/codefuse-ai/CodeFuse-MFT-VLM/blob/master/README.md?plain=1#L16'
    },
    {
        'leaderboard': 'https://github.com/codefuse-ai/codefuse-devops-eval',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/feedback-prize-2021/leaderboard',
        'reference': 'https://github.com/affjljoo3581/Feedback-Prize-Competition/blob/master/README.md?plain=1#L5'
    },
    {
        'leaderboard': 'https://gluebenchmark.com/leaderboard',
        'reference': 'https://github.com/microsoft/MT-DNN/blob/master/README.md?plain=1#L227'
    },
    {
        'leaderboard': 'https://github.com/AI-secure/Certified-Robustness-SoK-Oldver',
        'reference': ''
    },
    {
        'leaderboard': 'https://sokcertifiedrobustness.github.io/leaderboard',
        'reference': 'https://github.com/AI-secure/Certified-Robustness-SoK-Oldver/blob/master/README.md?plain=1#L1'
    },
    {
        'leaderboard': 'https://ml.energy/leaderboard',
        'reference': 'https://github.com/Green-Software-Foundation/awesome-green-software/blob/main/readme.md?plain=1#L125'
    },
    {
        'leaderboard': 'https://waymo.com/open/challenges/2020/3d-detection',
        'reference': 'https://github.com/ADLab-AutoDrive/INT/blob/main/README.md?plain=1#L37'
    },
    {
        'leaderboard': 'https://waymo.com/open/challenges/2023/motion-prediction',
        'reference': 'https://github.com/zhejz/HPTR/blob/main/README.md?plain=1#L26'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/1719/leaderboard',
        'reference': 'https://github.com/zhejz/HPTR/blob/main/README.md?plain=1#L69'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/yentinglin/open-tw-llm-leaderboard',
        'reference': 'https://github.com/MiuLab/Taiwan-LLM/blob/main/README.md?plain=1#L77'
    },
    {
        'leaderboard': 'https://www.kaggle.com/c/home-credit-default-risk/leaderboard',
        'reference': 'https://github.com/KazukiOnodera/Home-Credit-Default-Risk/blob/master/README.md?plain=1#L2'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/4318',
        'reference': 'https://github.com/shreyashampali/kypt_transformer/blob/master/README.md?plain=1#L120'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/4897',
        'reference': 'https://github.com/shreyashampali/kypt_transformer/blob/master/README.md?plain=1#L138'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/689/leaderboard',
        'reference': 'https://github.com/martiansideofthemoon/hurdles-longform-qa/blob/main/README.md?plain=1#L115'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/6738',
        'reference': 'https://github.com/psunlpgroup/MultiHiertt/blob/main/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/sci-m-wang/LangGPT-tools/blob/main/README.md?plain=1#L29'
    },
    {
        'leaderboard': 'https://skyworkai.github.io/agent-studio',
        'reference': 'https://github.com/SkyworkAI/agent-studio/blob/main/README.md?plain=1#L39'
    },
    {
        'leaderboard': 'https://flageval.baai.ac.cn/#/leaderboard/multimodal',
        'reference': 'https://github.com/Kwai-Kolors/Kolors/blob/master/README.md?plain=1#L60'
    },
    {
        'leaderboard': 'https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard',
        'reference': 'https://github.com/wel3kxial/AIGC_Resources/blob/main/README.md?plain=1#L758'
    },
    {
        'leaderboard': 'https://github.com/THUDM/ReST-MCTS',
        'reference': ''
    },
    {
        'leaderboard': 'https://www.cluebenchmarks.com',
        'reference': 'https://github.com/aymericdamien/TopDeepLearning/blob/master/README.md?plain=1#L733'
    },
    {
        'leaderboard': 'https://github.com/lampts/my_dl_solutions',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/DengPingFan/DAVSOD',
        'reference': ''
    },
    {
        'leaderboard': 'http://convai.io',
        'reference': 'https://github.com/aliannejadi/ClariQ/blob/master/README.md?plain=1#L475'
    },
    {
        'leaderboard': 'http://got-10k.aitestunion.com/leaderboard',
        'reference': 'https://github.com/got-10k/siamfc/blob/master/README.md?plain=1#L13'
    },
    {
        'leaderboard': 'https://github.com/SiatMMLab/Awesome-Diffusion-Model-Based-Image-Editing-Methods/blob/main/Leaderboard.md',
        'reference': ''
    },
    {
        'leaderboard': 'https://klue-benchmark.com/leaderboard',
        'reference': 'https://github.com/KLUE-benchmark/KLUE/blob/main/README.md?plain=1#L70'
    },
    {
        'leaderboard': 'https://crux-eval.github.io/leaderboard.html',
        'reference': 'https://github.com/facebookresearch/cruxeval/blob/main/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://github.com/inspire-group/patch-defense-leaderboard',
        'reference': 'https://github.com/inspire-group/PatchCleanser/blob/main/README.md?plain=1#L27'
    },
    {
        'leaderboard': 'https://github.com/Magnetic2014/RoleEval',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/SoccerNet/sn-spotting',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/sejong-rcv/MLPD-Multi-Label-Pedestrian-Detection',
        'reference': ''
    },
    {
        'leaderboard': 'https://rajpurkar.github.io/SQuAD-explorer',
        'reference': 'https://github.com/dallascard/NLP-power-analysis/blob/master/README.md?plain=1#L43'
    },
    {
        'leaderboard': 'https://www.aicrowd.com/challenges/imageclef-2019-vqa-med/leaderboards',
        'reference': 'https://github.com/abachaa/VQA-Med-2019/blob/master/README.md?plain=1#L6'
    },
    {
        'leaderboard': 'https://ogb.stanford.edu/docs/leader_nodeprop/#ogbn-arxiv',
        'reference': 'https://github.com/ytchx1999/PyG-OGB-Tricks/blob/main/README.md?plain=1#L20'
    },
    {
        'leaderboard': 'hhttps://ogb.stanford.edu/docs/leader_nodeprop/#ogbn-mag',
        'reference': 'https://github.com/ytchx1999/PyG-OGB-Tricks/blob/main/README.md?plain=1#L25'
    },
    {
        'leaderboard': 'https://ogb.stanford.edu/docs/leader_nodeprop/#ogbn-products',
        'reference': 'https://github.com/ytchx1999/PyG-OGB-Tricks/blob/main/README.md?plain=1#L30'
    },
    {
        'leaderboard': 'https://ogb.stanford.edu/docs/leader_nodeprop/#ogbn-proteins',
        'reference': 'https://github.com/ytchx1999/PyG-OGB-Tricks/blob/main/README.md?plain=1#L36'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/514/leaderboard',
        'reference': 'https://github.com/pzzhang/VinVL/blob/main/README.md?plain=1#L31'
    },
    {
        'leaderboard': 'https://eval.ai/web/challenges/challenge-page/355/leaderboard',
        'reference': 'https://github.com/pzzhang/VinVL/blob/main/README.md?plain=1#L31'
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/vcr',
        'reference': 'https://github.com/pzzhang/VinVL/blob/main/README.md?plain=1#L31'
    },
    {
        'leaderboard': 'https://github.com/layer6ai-labs/dgm-eval',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/salesforce/decaNLP',
        'reference': ''
    },
    {
        'leaderboard': 'https://leaderboard.carla.org/leaderboard',
        'reference': 'https://github.com/carla-simulator/carla/blob/dev/README.md?plain=1#L50'
    },
    {
        'leaderboard': 'https://github.com/eugenesiow/super-image',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/liuye6666/EWR-PGD',
        'reference': ''
    },
    {
        'leaderboard': 'http://host.robots.ox.ac.uk:8080/leaderboard/displaylb.php?challengeid=11&compid=6',
        'reference': 'https://github.com/TheLegendAli/DeepLab-Context/blob/master/README.md?plain=1#L39'
    },
    {
        'leaderboard': 'https://github.com/SoccerNet/sn-tracking',
        'reference': ''
    },
    {
        'leaderboard': 'https://leaderboard.allenai.org/mctaco',
        'reference': 'https://github.com/CogComp/MCTACO/blob/master/README.md?plain=1#L9'
    },
    {
        'leaderboard': 'https://cl-detection2023.grand-challenge.org/evaluation/challenge/leaderboard',
        'reference': 'https://github.com/5k5000/CLdetection2023/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://cl-detection2023.grand-challenge.org/evaluation/testing/leaderboard',
        'reference': 'https://github.com/5k5000/CLdetection2023/blob/master/README.md?plain=1#L7'
    },
    {
        'leaderboard': 'https://sokcertifiedrobustness.github.io/leaderboard',
        'reference': 'https://github.com/yinizhilian/ICLR2024-Papers-with-Code/blob/main/README.md?plain=1#L2853'
    },
    {
        'leaderboard': 'https://codalab.lisn.upsaclay.fr/competitions/7395',
        'reference': 'https://github.com/thunlp/Knowledge-Plugin/blob/master/README.md?plain=1#L137'
    },
    {
        'leaderboard': 'https://github.com/Kali-Hac/Awesome-Skeleton-Based-Models/tree/main/skeleton-based-action-recognition',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/Kali-Hac/Awesome-Skeleton-Based-Models/tree/main/3D-pose-estimation',
        'reference': ''
    },
    {
        'leaderboard': 'https://github.com/Kali-Hac/Awesome-Skeleton-Based-Models/tree/main/skeleton-based-person-reID',
        'reference': ''
    },
    {
        'leaderboard': 'https://nl2sql360.github.io/#leaderboard',
        'reference': 'https://github.com/HKUSTDial/NL2SQL360/blob/master/README.md?plain=1#L15'
    },
    {
        'leaderboard': 'https://github.com/yanyanSann/Long-Tailed-Classification-Leaderboard',
        'reference': 'https://github.com/zhangyongshun/BagofTricks-LT/blob/main/README.md?plain=1#L309'
    },
    {
        'leaderboard': 'https://teddy-xionggz.github.io/MIRAGE',
        'reference': 'https://github.com/Teddy-XiongGZ/MIRAGE/blob/main/README.md?plain=1#L115'
    },
]

# Each pair is (original leaderboard URL, list of descendant leaderboard URLs).
# The pairs are expanded below into dicts keyed by 'original' and 'descendants'.
_secondary_pairs = (
    (
        'https://gluebenchmark.com/leaderboard',
        ['https://super.gluebenchmark.com/leaderboard'],
    ),
    (
        'https://www.cluebenchmarks.com',
        [
            'https://www.superclueai.com',
            'https://github.com/CLUEbenchmark/SuperCLUEgkzw',
            'https://www.langyb.com',
        ],
    ),
    (
        'https://rank.opencompass.org.cn/leaderboard-llm',
        [
            'https://rank.opencompass.org.cn/leaderboard-llm-academic',
            'https://rank.opencompass.org.cn/leaderboard-arena',
            'https://rank.opencompass.org.cn/leaderboard-multimodal',
        ],
    ),
    (
        'https://artificialanalysis.ai/text-to-image',
        [
            'https://artificialanalysis.ai/leaderboards/models',
            'https://artificialanalysis.ai/leaderboards/providers',
            'https://artificialanalysis.ai/speech-to-text',
            'https://artificialanalysis.ai/text-to-speech',
        ],
    ),
    (
        'https://flageval.baai.ac.cn/#/leaderboard/multimodal',
        [
            'https://flageval.baai.ac.cn/#/leaderboard/nlp-capability',
            'https://flageval.baai.ac.cn/#/leaderboard/k12',
        ],
    ),
)

leaderboard_secondary = [
    {'original': original_url, 'descendants': descendant_urls}
    for original_url, descendant_urls in _secondary_pairs
]

In [18]:
# Report the size of each of the three orientation groups, one sentence per line.
print(
    f'There are {len(dataset_oriented_leaderboards)} dataset-oriented leaderboards.',
    f'There are {len(method_oriented_leaderboards)} method-oriented leaderboards.',
    f'There are {len(metric_oriented_leaderboards)} metric-oriented leaderboards.',
    sep='\n',
)
# There are 402 EvalAI + 648 Kaggle + 1 TAOST + 5 Artificial Analysis + rest = 1062 solution-oriented leaderboards.
# There are 5312 PapersWithCode + 78 GitHub + 336 HuggingFace + 49 Independent = 5775 model-oriented leaderboards.

There are 4 dataset-oriented leaderboards.
There are 15 method-oriented leaderboards.
There are 1 metric-oriented leaderboards.


In [19]:
# Read the 'Leaderboard' sheet; the workbook is only needed for this one read.
with pd.ExcelFile(path_meta / 'Foundation Model Leaderboards.xlsx') as workbook:
    df_leaderboard = pd.read_excel(workbook, sheet_name='Leaderboard')

# Rows hosted only on 'pwc' whose name is a key of pwc_leaderboard_mapping are
# replaced by one copy per mapped sub-name; every other row is kept unchanged.
expanded_rows = []
for _, record in df_leaderboard.iterrows():
    needs_expansion = record['Name'] in pwc_leaderboard_mapping and record['Platforms'] == 'pwc'
    if not needs_expansion:
        expanded_rows.append(record)
        continue
    for sub_name in pwc_leaderboard_mapping[record['Name']]:
        renamed_record = record.copy()
        renamed_record['Name'] = sub_name
        expanded_rows.append(renamed_record)

# Persist the expanded table; later cells reload it from this CSV.
df_leaderboard_expanded = pd.DataFrame(expanded_rows)
df_leaderboard_expanded.to_csv(path_meta / 'leaderboard_processed.csv', index=False)

In [20]:
# Running totals that are printed after every leaderboard row has been visited.
leaderboard_hosted_on_multiple_platforms = 0
leaderboard_without_model_linkage = 0
leaderboard_host_platform_mapping = defaultdict(int)

# Reload the expanded table and parse the string-encoded '(non-pwc)' columns.
# NOTE(review): this cell reads and later overwrites the same CSV, so re-running it
# without first regenerating the file feeds already-processed values back into
# string_to_list / string_to_dict -- confirm those helpers tolerate that.
df_leaderboard_expanded = pd.read_csv(path_meta / 'leaderboard_processed.csv')
df_leaderboard_expanded['Development workflows (non-pwc)'] = df_leaderboard_expanded['Development workflows (non-pwc)'].astype(str).apply(string_to_list)
df_leaderboard_expanded['Display formats (non-pwc)'] = df_leaderboard_expanded['Display formats (non-pwc)'].apply(lambda x: string_to_dict(x, list_format=True))
df_leaderboard_expanded['Publication venues (non-pwc)'] = df_leaderboard_expanded['Publication venues (non-pwc)'].apply(string_to_list)
df_leaderboard_expanded['Release organizations (non-pwc)'] = df_leaderboard_expanded['Release organizations (non-pwc)'].apply(string_to_list)

# Pre-create the merged columns with one independent empty list per row so that
# list values can be written cell by cell with .at inside the loop.
for merged_column in ('Display formats', 'Development workflows', 'Release organizations'):
    df_leaderboard_expanded[merged_column] = [[] for _ in range(len(df_leaderboard_expanded))]

for index, row in df_leaderboard_expanded.iterrows():
    display_formats = set(row['Display formats (non-pwc)'])
    # presumably returns a set: the result is mutated with .add() below -- verify against the helper
    publishers = publisher_synonyms_mapping(row['Release organizations (non-pwc)'])
    workflows = set(row['Development workflows (non-pwc)'])

    # Split the comma-separated platform codes once and reuse the result.
    platforms = row['Platforms'].split(',')
    for platform in platforms:
        leaderboard_host_platform_mapping[platform] += 1

    if len(platforms) > 1:
        leaderboard_hosted_on_multiple_platforms += 1

    # Only leaderboards hosted exclusively on 'pwc' get the extra publisher.
    if row['Platforms'] == 'pwc':
        publishers.add('Papers With Code')

    # Substring test on the raw platform string: any row mentioning 'pwc' inherits
    # the pwc display formats and workflow; only the remaining rows are checked
    # for a missing model linkage.
    if 'pwc' in row['Platforms']:
        display_formats = display_formats.union(display_format_pwc)
        workflows = workflows.union(workflow_pwc)
    elif pd.isna(row['Model linkage (non-pwc)']):
        leaderboard_without_model_linkage += 1

    # Sort before storing: iteration order of a set of strings changes between
    # interpreter runs, which would make the written CSV differ on every run.
    df_leaderboard_expanded.at[index, 'Display formats'] = sorted(display_formats, key=str)
    df_leaderboard_expanded.at[index, 'Development workflows'] = sorted(workflows, key=str)
    df_leaderboard_expanded.at[index, 'Release organizations'] = sorted(publishers, key=str)

df_leaderboard_expanded.to_csv(path_meta / 'leaderboard_processed.csv', index=False)

total_leaderboards = len(df_leaderboard_expanded)
print(f"Total number of leaderboards: {total_leaderboards}")
print(f"{round(leaderboard_without_model_linkage/total_leaderboards*100,2)}% ({leaderboard_without_model_linkage} out of {total_leaderboards}) leaderboards do not have any model provenance links.")
print(f"{round(leaderboard_hosted_on_multiple_platforms/total_leaderboards*100,2)}% ({leaderboard_hosted_on_multiple_platforms} out of {total_leaderboards}) leaderboards are hosted on multiple platforms.")

# Number of leaderboards per exact platform combination (the raw 'Platforms' value).
leaderboard_distribution = df_leaderboard_expanded['Platforms'].value_counts().to_dict()

fig = px.bar(
    x=list(leaderboard_distribution.keys()),
    y=list(leaderboard_distribution.values()),
    text_auto=True,
    labels={'x': 'Host Platforms', 'y': 'Number of Leaderboards'},
)
# Update the layout for a tighter look
fig.update_layout(
    autosize=True,
    margin=dict(
        l=10,  # Left margin
        r=10,  # Right margin
        b=10,  # Bottom margin
        t=10,  # Top margin
        pad=4  # Padding between the plot and the margin
    ),
    xaxis=dict(title_font=dict(size=18, family='Arial, bold', color='black'),tickfont=dict(color='black')),
    yaxis=dict(title_font=dict(size=18, family='Arial, bold', color='black'),tickfont=dict(color='black')),
)
# The PDF is exported before the fixed on-screen size is applied.
pio.write_image(fig, f'{path_meta}/platform-combo-distribution.pdf')
fig.update_layout(
    width=1200,  # Set the width of the figure
    height=800,  # Set the height of the figure
)
fig.show()

# Per-platform totals; a leaderboard hosted on several platforms is counted once
# for each of them, so these percentages can add up to more than 100.
for key, value in leaderboard_host_platform_mapping.items():
    print(f"{key.upper()}: {value} ({round(value/total_leaderboards*100,2)}%)")

Total number of leaderboards: 721
16.64% (120 out of 721) leaderboards do not have any model provenence links.
7.91% (57 out of 721) leaderboards are hosted on multiple platforms.


HF: 120 (16.64%)
GH: 120 (16.64%)
PWC: 446 (61.86%)
IP: 96 (13.31%)


In [21]:
# Reload the processed table; the list column is stored in the CSV as a Python literal.
df = pd.read_csv(path_meta / 'leaderboard_processed.csv')
df['Development workflows'] = df['Development workflows'].apply(ast.literal_eval)
total_leaderboards = len(df)

# df = df[df['Development workflows'].map(len) > 0]
# One row per (leaderboard, workflow) pair, then the number of rows per workflow.
df_workflow = (
    df.explode('Development workflows')
    .groupby('Development workflows')
    .size()
    .reset_index(name='Frequency')
)
df_workflow['Development workflows'] = df_workflow['Development workflows'].apply(lambda x: f'Pattern {x}' if x != 'Unknown' else x)
df_workflow = df_workflow.sort_values(by='Frequency', ascending=False)
df_workflow['Weight'] = 1

# After the descending sort the first row is the most frequent workflow.
top_pattern = df_workflow['Development workflows'].iloc[0]
top_frequency = df_workflow['Frequency'].iloc[0]

print(f"{top_pattern} is the most prevalent ({top_frequency} out of {total_leaderboards}) workflow patterns that accounts for {round(top_frequency/total_leaderboards*100,2)}%.")
df_pwc = df[df['Platforms'].str.contains('pwc')]
# NOTE(review): the sentence says "non-PWC", but both the count and the denominator
# are taken over every row of df -- confirm which population is intended.
multi_pattern_count = len(df[df['Development workflows'].map(len) > 1])
print(f"There are {round(multi_pattern_count/total_leaderboards*100,2)}% ({multi_pattern_count} out of {total_leaderboards}) non-PWC leaderboards with multiple workflow patterns.")
print(f'In {top_pattern}, {round(len(df_pwc)/top_frequency*100,2)}% ({len(df_pwc)} out of {top_frequency}) of the leaderboards are hosted on Papers With Code.')

# NOTE(review): Mean/Median/IQR use every row, while the Gini coefficient drops
# the 'Unknown' row -- confirm the asymmetry is intentional.
workflow_frequencies = df_workflow['Frequency']
statistics = {
    'Distribution': 'Leaderboards across Workflow Patterns',
    'Mean': np.mean(workflow_frequencies),
    'Median': np.median(workflow_frequencies),
    'IQR': workflow_frequencies.quantile(0.75) - workflow_frequencies.quantile(0.25),
    'Gini Coefficient': ineqpy.inequality.gini(data=df_workflow[df_workflow['Development workflows'] != 'Unknown'], income='Frequency', weights='Weight'),
}

# Upsert this distribution's row into the shared statistics file (latest entry wins).
statistics_path = path_meta / 'leaderboard_statistics.csv'
df_statistics = pd.read_csv(statistics_path) if statistics_path.exists() else pd.DataFrame()
df_statistics = (
    pd.concat([df_statistics, pd.DataFrame([statistics])], ignore_index=True)
    .drop_duplicates(subset=['Distribution'], keep='last')
    .sort_values(by='Distribution')
)
df_statistics.to_csv(statistics_path, index=False)

# Plot the share of leaderboards per known workflow (the 'Unknown' row is left out).
df_workflow = df_workflow[df_workflow['Development workflows'] != 'Unknown'].assign(
    Ratio=lambda frame: (frame['Frequency'] / total_leaderboards * 100).round(2)
)
fig = px.bar(
    x=df_workflow['Development workflows'],
    y=df_workflow['Ratio'],
    text_auto=True,
    labels={'x': 'Deployment workflows', 'y': 'Leaderboard Percentage'},
)
fig.update_layout(width=1200, height=800)  # fixed on-screen figure size
fig.show()

Pattern 1 is the most prevalent (475 out of 721) workflow patterns that accounts for 65.88%.
There are 11.79% (85 out of 721) non-PWC leaderboards with multiple workflow patterns.
In Pattern 1, 93.89% (446 out of 475) of the leaderboards are hosted on Papers With Code.


In [22]:
df = pd.read_csv(path_meta / 'leaderboard_processed.csv')

# Rows that have any value recorded in the '#Empty ranking dataframes (non-pwc)' column.
empty_ranking_column = df['#Empty ranking dataframes (non-pwc)']
flagged_count = len(df[empty_ranking_column.notna()])
print(f"{round(flagged_count/len(df)*100,2)}% ({flagged_count} out of {len(df)}) leaderboards have empty ranking dataframes.")

# Last expression of the cell: how often each recorded value occurs.
empty_ranking_column.value_counts().reset_index(name='Frequency')

0.42% (3 out of 721) leaderboards have empty ranking dataframes.


Unnamed: 0,#Empty ranking dataframes (non-pwc),Frequency
0,25,1
1,Unknown,1
2,2,1


In [23]:
# Reload the processed table; the list column is stored in the CSV as a Python literal.
df = pd.read_csv(path_meta / 'leaderboard_processed.csv')
df['Release organizations'] = df['Release organizations'].apply(ast.literal_eval)
total_leaderboards = len(df)

# One row per (leaderboard, organization) pair, then leaderboards per organization.
df_split = (
    df.explode('Release organizations')
    .groupby('Release organizations')
    .size()
    .reset_index(name='Frequency')
)
df_split['Weight'] = 1

organization_frequencies = df_split['Frequency']
statistics = {
    'Distribution': 'Leaderboards across Release Organizations',
    'Mean': np.mean(organization_frequencies),
    'Median': np.median(organization_frequencies),
    'IQR': organization_frequencies.quantile(0.75) - organization_frequencies.quantile(0.25),
    'Gini Coefficient': ineqpy.inequality.gini(data=df_split, income='Frequency', weights='Weight'),
}

# Upsert this distribution's row into the shared statistics file (latest entry wins).
statistics_path = path_meta / 'leaderboard_statistics.csv'
df_statistics = pd.read_csv(statistics_path) if statistics_path.exists() else pd.DataFrame()
df_statistics = (
    pd.concat([df_statistics, pd.DataFrame([statistics])], ignore_index=True)
    .drop_duplicates(subset=['Distribution'], keep='last')
    .sort_values(by='Distribution')
)
df_statistics.to_csv(statistics_path, index=False)

df_top = df_split.sort_values(by='Frequency', ascending=False).head(10)
leading_organization = df_top['Release organizations'].iloc[0]
leading_frequency = df_top['Frequency'].iloc[0]
# NOTE(review): one organization is subtracted from the distinct count; the code does
# not show which entry is being excluded -- confirm the intent of the "-1".
identified_organizations = len(df_split['Release organizations'].unique()) - 1
print(f"{leading_organization} stands out as the most prolific release organization among the {identified_organizations} identified organizations, contributing to a notable {round(leading_frequency/total_leaderboards*100,2)}% ({leading_frequency} out of {total_leaderboards}) leaderboards.")

df_top = df_top.assign(Ratio=(df_top['Frequency'] / total_leaderboards * 100).round(2))

# Horizontal bar chart of the ten most frequent organizations, largest on top.
top_bars = go.Bar(
    x=df_top['Frequency'],  # bar lengths
    y=df_top['Release organizations'],  # one bar per organization
    orientation='h',
    text=df_top['Frequency'],  # value label on each bar
    textposition='auto',
)
fig = go.Figure(top_bars)
fig.update_layout(
    title='Number of Leaderboards across Release Organizations (Top 10)',
    xaxis_title='Leaderboard Number',
    yaxis_title='Publisher Name',
    yaxis_autorange='reversed',  # first row is drawn at the top
    width=1200,
    height=800,
)
fig.show()


Papers With Code stands out as the most prolific release organization among the 253 identified organizations, contributing to a notable 61.44% (443 out of 721) leaderboards.


In [24]:
# Reload the processed table; the list column is stored in the CSV as a Python literal.
df = pd.read_csv(path_meta / 'leaderboard_processed.csv')
df['Display formats'] = df['Display formats'].apply(ast.literal_eval)
total_leaderboards = len(df)

df_multiple = df[df['Display formats'].map(len) > 1]
print(f"{round(len(df_multiple)/total_leaderboards*100,2)}% ({len(df_multiple)} out of {total_leaderboards}) leaderboards support multiple display formats.")

# NOTE(review): restates the value already assigned to display_format_rankable in
# the configuration cell; kept so this cell behaves the same when run on its own.
display_format_rankable = ['Rankable Table', 'Rankable Bar Chart']
df_rankable = keep_rows_by_list_column(df, 'Display formats', display_format_rankable)
rankable_total = len(df_rankable)
print(f"{round(rankable_total/total_leaderboards*100,2)}% ({rankable_total} out of {total_leaderboards}) leaderboards support rankable display formats.")

# NOTE(review): the ranking below covers every display format listed on the kept
# rows, not only the two rankable formats -- confirm that is the intended comparison.
df_rankable_split = (
    df_rankable.explode('Display formats')['Display formats']
    .value_counts()
    .reset_index(name='Frequency')
)
leading_format = df_rankable_split['Display formats'].iloc[0]
leading_frequency = df_rankable_split['Frequency'].iloc[0]
print(f"{leading_format} is the most popular display format of rankable leaderboards, accounting for {round(leading_frequency/rankable_total*100,2)}% ({leading_frequency} out of {rankable_total}) rankable leaderboards.")

# Frequency of every display format across all leaderboards.
df_split = (
    df.explode('Display formats')['Display formats']
    .value_counts()
    .reset_index(name='Frequency')
)
df_split['Weight'] = 1

format_frequencies = df_split['Frequency']
statistics = {
    'Distribution': 'Leaderboards across Display Formats',
    'Mean': np.mean(format_frequencies),
    'Median': np.median(format_frequencies),
    'IQR': format_frequencies.quantile(0.75) - format_frequencies.quantile(0.25),
    'Gini Coefficient': ineqpy.inequality.gini(data=df_split, income='Frequency', weights='Weight'),
}

# Upsert this distribution's row into the shared statistics file (latest entry wins).
statistics_path = path_meta / 'leaderboard_statistics.csv'
df_statistics = pd.read_csv(statistics_path) if statistics_path.exists() else pd.DataFrame()
df_statistics = (
    pd.concat([df_statistics, pd.DataFrame([statistics])], ignore_index=True)
    .drop_duplicates(subset=['Distribution'], keep='last')
    .sort_values(by='Distribution')
)
df_statistics.to_csv(statistics_path, index=False)

df_split['Ratio'] = (df_split['Frequency'] / total_leaderboards * 100).round(2)

fig = px.bar(
    x=df_split['Display formats'],
    y=df_split['Frequency'],
    text_auto=True,
    labels={'x': 'Display format', 'y': 'Number of Leaderboards'},
)
# Tight margins plus a fixed on-screen size.
fig.update_layout(
    autosize=True,
    margin=dict(l=10, r=10, b=10, t=10, pad=4),  # pad: gap between plot and margin
    width=1200,
    height=800,
)
fig.show()

75.45% (544 out of 721) leaderboards support multiple display formats.
88.9% (641 out of 721) leaderboards support rankable display formats.
Rankable Table is the most popular display format of rankable leaderboards, accounting for 99.84% (640 out of 641) rankable leaderboards.


In [25]:
# Keep every leaderboard that is not hosted exclusively on 'pwc'. The explicit
# .copy() makes the filtered frame independent, so the column assignment on the
# next line can never be treated as a write into a slice of the loaded frame.
df = pd.read_csv(path_meta / 'leaderboard_processed.csv')
df = df[df['Platforms'] != 'pwc'].copy()
df['Publication venues (non-pwc)'] = df['Publication venues (non-pwc)'].apply(ast.literal_eval)

# Leaderboards with at least one recorded publication venue.
df_pub = df[df['Publication venues (non-pwc)'].apply(len) > 0]
print(f"{round(len(df_pub)/len(df)*100,2)}% ({len(df_pub)} out of {len(df)}) leaderboards are associated with specific publications, including research articles, blog posts, and white papers.")

# presumably drops rows whose venue list contains one of the non-accepted
# publication types -- verify against filter_rows_by_list_column
df_literature = filter_rows_by_list_column(df_pub, 'Publication venues (non-pwc)', non_accepted_publication_type)
print(f"{round(len(df_literature)/len(df_pub)*100,2)}% ({len(df_literature)} out of {len(df_pub)}) publications have been accepted in a specific workshop, conference, magazine, or journal.")

# One row per (leaderboard, venue) pair, then the number of leaderboards per venue.
df_split = df_literature.explode('Publication venues (non-pwc)').groupby('Publication venues (non-pwc)').size().reset_index(name='Frequency')
df_split['Weight'] = 1

statistics = {
    'Distribution': 'Leaderboards across Publication Venues',
    'Mean': np.mean(df_split['Frequency']),
    'Median': np.median(df_split['Frequency']),
    'IQR': df_split['Frequency'].quantile(0.75) - df_split['Frequency'].quantile(0.25),
    'Gini Coefficient': ineqpy.inequality.gini(data=df_split, income='Frequency', weights='Weight'),
}

# Upsert this distribution's row into the shared statistics file (latest entry wins).
statistics_path = path_meta / 'leaderboard_statistics.csv'
if statistics_path.exists():
    df_statistics = pd.read_csv(statistics_path)
else:
    df_statistics = pd.DataFrame()
df_statistics = pd.concat([df_statistics, pd.DataFrame([statistics])], ignore_index=True)
df_statistics = df_statistics.drop_duplicates(subset=['Distribution'], keep='last')
df_statistics = df_statistics.sort_values(by='Distribution')
df_statistics.to_csv(statistics_path, index=False)

# Ten most frequent venues; the first row is the overall leader.
df_top = df_split.sort_values(by='Frequency', ascending=False).head(10).copy()
print(f"{df_top['Publication venues (non-pwc)'].iloc[0]} emerges as the conference with the most number of accepted publications, accounting for {round(df_top['Frequency'].iloc[0]/len(df_literature)*100,2)}% ({df_top['Frequency'].iloc[0]} out of {len(df_literature)}) of those published.")

df_top['Ratio'] = round(df_top['Frequency'] / len(df_literature) * 100, 2)

fig = go.Figure(go.Bar(
    x=df_top['Frequency'],  # Values for the bar lengths
    y=df_top['Publication venues (non-pwc)'],  # Categories for each bar
    orientation='h',  # Sets the bars to be horizontal
    text=df_top['Frequency'],  # Adds the values as text on each bar
    textposition='auto'  # Automatically positions the text on the bars
))
fig.update_layout(
    title='Number of non-PWC Leaderboards with Accepted Publications across Publication Venues (Top 10)',
    xaxis_title='Leaderboard Number',
    yaxis_title='Publication Name',
    yaxis_autorange='reversed'  # This line makes the bars go top-down
)
fig.update_layout(
    width=1200,  # Set the width of the figure
    height=800,  # Set the height of the figure
)
fig.show()


71.22% (198 out of 278) leaderboards are associated with specific publications, including research articles, blog posts, and white papers.
32.32% (64 out of 198) publications have been accepted in a specific workshop, conference, magzine, or journal.
NeurIPS emerges as the conference with the most number of accepted publications, accounting for 21.88% (14 out of 64) of those published.


In [26]:
df = pd.read_csv(path_meta / 'leaderboard_processed.csv')
total_leaderboards = len(df)

# Documentation / contacts: every leaderboard except those named in the exclusion lists.
with_documentation = total_leaderboards - len(leaderboard_system_without_documentation)
print(f"{round(with_documentation/total_leaderboards*100, 2)}% ({with_documentation} out of {total_leaderboards}) leaderboards provide documentation.")
with_contacts = total_leaderboards - len(leaderboard_system_without_contacts)
print(f"{round(with_contacts/total_leaderboards*100, 2)}% ({with_contacts} out of {total_leaderboards}) leaderboards provide contact information.")

# Submission channels: rows kept by keep_rows_by_list_column for the listed workflow patterns.
df['Development workflows'] = df['Development workflows'].apply(ast.literal_eval)
df_submission = keep_rows_by_list_column(df, 'Development workflows', workflow_patterns_with_submission)
print(f"{round(len(df_submission)/total_leaderboards*100, 2)}% ({len(df_submission)} out of {total_leaderboards}) leaderboards provide submission channels.")

# The remaining figures also subtract the leaderboards hosted exclusively on 'pwc'.
df_pwc = df[df['Platforms'] == 'pwc']
with_harness = total_leaderboards - len(leaderboard_system_without_evaluation_harness) - len(df_pwc)
print(f"{round(with_harness/total_leaderboards*100, 2)}% ({with_harness} out of {total_leaderboards}) leaderboards provide evaluation harness.")
with_pull_requests = total_leaderboards - len(leaderboard_system_without_pull_requests) - len(df_pwc)
print(f"{round(with_pull_requests/total_leaderboards*100, 2)}% ({with_pull_requests} out of {total_leaderboards}) leaderboards provide pull request channels.")
# NOTE(review): the discussion-forum figure is derived from the pull-request exclusion
# list, so it always equals the line above -- confirm no separate list was intended.
with_discussion_forums = total_leaderboards - len(leaderboard_system_without_pull_requests) - len(df_pwc)
print(f"{round(with_discussion_forums/total_leaderboards*100, 2)}% ({with_discussion_forums} out of {total_leaderboards}) leaderboards provide discussion forums.")

99.86% (720 out of 721) leaderboards provide documentation.
99.86% (720 out of 721) leaderboards provide contact information.
100.0% (721 out of 721) leaderboards provide submission channels.
38.42% (277 out of 721) leaderboards provide evaluation harness.
36.75% (265 out of 721) leaderboards provide pull request channels.
36.75% (265 out of 721) leaderboards provide discussion forums.


In [27]:
# Render the accumulated distribution statistics as a LaTeX table.
df = pd.read_csv(path_meta / 'leaderboard_statistics.csv')

# Placeholder shown in the table wherever a statistic is missing.
missing_marker = '$\\times$'
# Number format applied to each statistic column.
number_formats = {
    'Mean': '{:.2f}',
    'Median': '{:.1f}',
    'IQR': '{:.0f}',
    'Gini Coefficient': '{:.3f}',
}


def _format_statistic(value, template):
    """Format one table cell.

    Missing values become the placeholder, numbers are rendered with
    ``template``, and anything else is passed through unchanged. Formatting
    cell by cell avoids applying a float format to the string placeholder,
    which would raise ValueError.
    """
    if pd.isna(value):
        return missing_marker
    if isinstance(value, (int, float)):
        return template.format(value)
    return value


for column, template in number_formats.items():
    # Bind the template as a default argument so each column keeps its own format.
    df[column] = df[column].map(lambda value, template=template: _format_statistic(value, template))

# Any other column with missing values gets the same placeholder.
df = df.fillna(missing_marker)
print(df.to_latex(index=False))

\begin{tabular}{lllll}
\toprule
Distribution & Mean & Median & IQR & Gini Coefficient \\
\midrule
Leaderboards across Display Formats & 117.73 & 7.0 & 71 & 0.853 \\
Leaderboards across Publication Venues & 3.14 & 1.5 & 3 & 0.517 \\
Leaderboards across Release Organizations & 4.69 & 1.0 & 2 & 0.718 \\
Leaderboards across Workflow Patterns & 161.80 & 77.0 & 220 & 0.722 \\
\bottomrule
\end{tabular}



In [28]:
# Sum of distinct non-null values over every column of every counted sheet.
total_smell_count = 0
# sheet name -> {column name -> number of distinct non-null values}
unique_counts = {}

with pd.ExcelFile(path_meta / 'Foundation Model Leaderboards.xlsx') as xls:
    for sheet_name in xls.sheet_names:
        # The 'Leaderboard' sheet is not part of this tally.
        if sheet_name == 'Leaderboard':
            continue

        df = pd.read_excel(xls, sheet_name=sheet_name)

        # This sheet is only reported by its row count and is not added to the tally.
        if sheet_name == 'Self-admitted Technical Debt':
            # NOTE(review): the reported figure is the row count plus one; the reason
            # for the "+1" is not visible here -- confirm.
            print(f'There are {len(df)+1} SATD examples.')
            continue

        per_column_counts = {column: df[column].dropna().nunique() for column in df.columns}
        if per_column_counts:
            unique_counts.setdefault(sheet_name, {}).update(per_column_counts)
            total_smell_count += sum(per_column_counts.values())

print(f'There are {total_smell_count} leaderboard smell examples.')

# One row per sheet, one column per sheet column; absent combinations are blank
# and float counts are converted to integers.
result_df = (
    pd.DataFrame(unique_counts)
    .transpose()
    .fillna('')
    .map(lambda x: int(x) if isinstance(x, float) else x)
)
result_df

There are 34 SATD examples.
There are 320 leaderboard smell examples.


Unnamed: 0,Benchmark Metric,Benchmark Protocol,Benchmark Raw Dataset,Evaluation Record/Result,Model (Information),Ranking Dataframe,Submission Channel/Guideline,Benchmark Task,Uncategorized
Confusing Entity,4.0,10.0,24.0,11.0,7.0,4.0,21.0,,
Deprecated Entity,,,3.0,1.0,1.0,7.0,3.0,,
Inaccessible Entity,,,2.0,3.0,1.0,13.0,7.0,,
Misdisplayed Entity,5.0,2.0,,,,3.0,,,
Mismatched Entity,3.0,1.0,2.0,2.0,6.0,3.0,,2.0,
Missing Entity,,1.0,,7.0,,15.0,1.0,,
Redundant Entity,,,,3.0,2.0,4.0,,,
Unresponsive Entity,,,,,,103.0,3.0,,
Others,,,,,,,,,30.0
