# Model table

Small notebook that unifies the model information into a single table, which can be exported to Excel for editing and then added to the paper (used to generate Table 1 of the manuscript).

In [4]:
import pandas as pd
from pathlib import Path

# Input locations: both metadata CSVs live under ../derivatives/metadata.
derivatives_folder = Path("..") / "derivatives"
metadata_folder = derivatives_folder.joinpath("metadata")
models_info_filename = metadata_folder.joinpath("models-info.csv")
model_sizes_filename = metadata_folder.joinpath("model_sizes.csv")

In [None]:
# Load the two metadata tables; the sizes file names its key column "model",
# so it is renamed to match the "model_name" key used for the merge.
model_info = pd.read_csv(models_info_filename)
model_sizes = pd.read_csv(model_sizes_filename).rename(columns={"model": "model_name"})

# Column order of the final table.
table_columns = [
    "modality",
    "family",
    "training",
    "model",
    "num_parameters",
    "num_layers",
    "inner_dim",
    "model_name",
]

df = (
    model_info.merge(model_sizes, on="model_name")
    # Empty placeholder column (left blank here).
    .assign(training="")
    .loc[:, table_columns]
    # Modality descending, then family and parameter count ascending.
    .sort_values(["modality", "family", "num_parameters"], ascending=[False, True, True])
    # Capitalize only after sorting so the ordering uses the raw values.
    .assign(modality=lambda table: table["modality"].str.capitalize())
)


def format_size(x):
    """Format a parameter count as a short human-readable label.

    Args:
        x: Number of parameters (int or float).

    Returns:
        ``"X.XB"`` for counts in the billions, ``"XM"`` for counts in the
        millions, and ``str(x)`` unchanged for anything below one million.
        Counts just under one billion that would round up to 1000 million
        are reported as ``"1.0B"`` rather than ``"1000M"``.
    """
    if x >= 1e9:
        return f"{x / 1e9:.1f}B"
    if x >= 1e6:
        millions = f"{x / 1e6:.0f}"
        # Values in [999.5M, 1e9) round up to "1000"; roll over to billions
        # so the label never reads "1000M".
        if millions == "1000":
            return f"{x / 1e9:.1f}B"
        return f"{millions}M"
    return str(x)
    
# Turn raw parameter counts into short labels; the cast to str guarantees the
# `.str` accessor below is available.
df["num_parameters"] = df["num_parameters"].apply(format_size).astype(str)
# Drop a trailing ".0" only ("7.0B" -> "7B"). The pattern is anchored to the end
# of the label (before an optional B/M suffix) so a ".0" elsewhere in the text
# is never removed.
df["num_parameters"] = df["num_parameters"].str.replace(r"\.0(?=[BM]?$)", "", regex=True)

# Display names for the model families; families not listed keep their value.
family_display_names = {
    'Clip': 'CLIP (Vision)', # CLIP ViT https://arxiv.org/pdf/2212.07143
    'Clip-FT': 'CLIP (Vision)',
    'AugReg': 'ViT (AugReg)', # Augreg: https://arxiv.org/pdf/2106.10270
    'BloomZ': 'BLOOMZ',
    'Gemma-2': 'Gemma 2',
    'Huggyllama': 'LLaMA',
    'Llama-3': 'LLaMA 3',
    'Llama-3.1': 'LLaMA 3',
    'Open-Llama': 'LLaMA', # OpenLLaMA
}
df["family"] = df["family"].replace(family_display_names)

# Uncomment to export the table to Excel for manual editing.
#df.to_excel("models-info.xlsx", index=False)
df


Unnamed: 0,modality,family,training,model,num_parameters,num_layers,inner_dim,model_name
30,Vision,ViT (AugReg),,AugReg-ViT-tiny,10M,12,192,vit_tiny_patch16_224.augreg_in21k_pool-cls
29,Vision,ViT (AugReg),,AugReg-ViT-small,30M,12,384,vit_small_patch16_224.augreg_in21k_pool-cls
15,Vision,ViT (AugReg),,AugReg-ViT-base,103M,12,768,vit_base_patch16_224.augreg_in21k_pool-cls
26,Vision,ViT (AugReg),,AugReg-ViT-large,326M,24,1024,vit_large_patch16_224.augreg_in21k_pool-cls
18,Vision,CLIP (Vision),,CLIP-ViT-base,86M,12,768,vit_base_patch16_clip_224.laion2b_pool-cls
24,Vision,CLIP (Vision),,CLIP-ViT-large,304M,24,1024,vit_large_patch14_clip_224.laion2b_pool-cls
22,Vision,CLIP (Vision),,CLIP-ViT-huge,632M,32,1280,vit_huge_patch14_clip_224.laion2b_pool-cls
17,Vision,CLIP (Vision),,CLIP-ViT-base-FT,95M,12,768,vit_base_patch16_clip_224.laion2b_ft_in12k_poo...
23,Vision,CLIP (Vision),,CLIP-ViT-large-FT,315M,24,1024,vit_large_patch14_clip_224.laion2b_ft_in12k_po...
21,Vision,CLIP (Vision),,CLIP-ViT-huge-FT,646M,32,1280,vit_huge_patch14_clip_224.laion2b_ft_in12k_poo...
