The model card template makes use of Jinja, hence we need to install the necessary package.

In [4]:
!pip install Jinja2

Defaulting to user installation because normal site-packages is not writeable


Required import statement

In [5]:
from huggingface_hub import ModelCard, ModelCardData

Before running the cell below, upload the provided model card template (`COMP34812_modelcard_template.md`) using the Colab file browser (on the left-hand side).

In [None]:
# Metadata attached to the model card: language, licence, tags and source repo.
# Point `repo` at your own GitHub/GitLab repository before running this cell.
card_data = ModelCardData(
    language="en",
    license="cc-by-4.0",
    tags=["text-classification"],
    repo="https://github.com/AAP9002/COMP34812-NLU-NLI",
    ignore_metadata_errors=True,
)

# Render the model card by filling the template file with the fields below.
# Every keyword after `template_path` is handed to the template as a variable.
card = ModelCard.from_template(
    card_data = card_data,
    template_path='COMP34812_modelcard_template.md',
    # change the following line to indicate your respective usernames
    # and the abbreviation of the relevant track name, e.g., NLI, ED, AV
    model_id = 'z72819ap-e91802zc-NLI',
    # NOTE(review): the base model is declared as roberta-base here, while the
    # hyperparameter and size sections below name a "Roberta Large" model.
    # Confirm which is correct and align the two.
    base_model_repo = 'https://huggingface.co/FacebookAI/roberta-base',
    base_model_paper = 'https://arxiv.org/abs/1907.11692',
    base_model = 'roberta-base',
    model_architecture = 'Transformers',
    model_type = 'Supervised',
    language = 'English',
    model_summary = '''This is a classification model that was trained to detect whether a premise and hypothesis entail each other or not, using binary classification.''',
    developers = 'Alan Prophett and Zac Curtis',
    testing_data = 'A subset of the development set provided, amounting to 6K+ pairs.',
    hyperparameters = '''
    All Models and datasets
      - seed: 42

    Roberta Large NLI Binary Classification Model
      - learning_rate: 2e-05
      - train_batch_size: 16
      - eval_batch_size: 16
      - num_epochs: 5

    Semantic Textual Similarity Binary Classification Model
      - learning_rate: 2e-05
      - train_batch_size: 16
      - eval_batch_size: 16
      - num_epochs: 5

    Ensemble Meta Model
      - learning_rate: 2e-05
      - train_batch_size: 128
      - eval_batch_size: 16
      - num_epochs: 3
      ''',
    testing_metrics = '''
      - Precision
      - Recall
      - F1-score
      - Accuracy''',
    results = 'The Ensemble Model obtained an F1-score of 91% and an accuracy of 91%.',
    # Section heading spelling matches "Ensemble Meta Model" used in the
    # hyperparameters section so the rendered card is consistent.
    speeds_sizes_times = '''
      - overall training time: 309 minutes 30 seconds

    Roberta Large NLI Binary Classification Model
      - duration per training epoch: 11 minutes
      - model size: 1.42 GB

    Semantic Textual Similarity Binary Classification Model
      - duration per training epoch: 4 minutes 30 seconds
      - model size: 501 MB

    Ensemble Meta Model
      - duration per training epoch: 4 minutes
      - model size: 1.92 GB''',
    model_description = '''This model is based upon an ensemble of RoBERTa models that was fine-tuned using over 24K premise-hypothesis pairs from the shared task dataset for Natural Language Inference (NLI).''',
    hardware_requirements = '''
      - RAM: at least 10 GB
      - Storage: at least 4GB
      - GPU: a100 40GB''',
    software = '''
      - Tensorflow 2.18.0+cu12.4
      - Transformers 4.50.3
      - Pandas 2.2.2
      - NumPy 2.0.2
      - Seaborn 0.13.2
      - Huggingface_hub 0.30.1
      - Matplotlib 3.10.0
      - Scikit-learn 1.6.1''',
    bias_risks_limitations = '''Any inputs (concatenation of two sequences) longer than
      512 subwords will be truncated by the model.''',
    additional_information = '''The hyperparameters were determined by experimentation
      with different values.''',
    training_data = '24K+ premise-hypothesis pairs from the shared task dataset provided for Natural Language Inference (NLI).',
)

# Write the rendered card to a markdown (.md) file; this becomes one of your model cards.
# Change the filename accordingly.
# The encoding is set explicitly so the output file does not depend on the
# platform's default locale encoding.
with open('my_model_card.md', 'w', encoding='utf-8') as model_card:
    model_card.write(card.content)

Repo card metadata block was not found. Setting CardData to empty.
