In [3]:
import json


# List of JSON files to process
json_files = [
    "./model_analysis_type_question-answering_min_dl_1000_lib_transformers.json",
    "./model_analysis_type_text-classification_min_dl_1000_lib_transformers.json", 
    "./model_analysis_type_text-generation_min_dl_1000_lib_transformers.json",
    "./model_analysis_type_token-classification_min_dl_1000_lib_transformers.json"
]

# Dictionary to store all models and their dependencies across files
all_model_dependencies = {}
models_with_version_info = {}

# Process each JSON file
for json_file in json_files:
    try:
        with open(json_file, 'r') as f:
            data = json.load(f)
            
        # Process models in current file
        for model in data:
            model_id = model['model_id']
            deps = model.get('dependencies', [])
            
            if deps:
                all_model_dependencies[model_id] = []
                has_non_null_version = False
                
                for dep in deps:
                    if len(dep) == 2:
                        library, version = dep
                        all_model_dependencies[model_id].append((library, version))
                        if version is not None:
                            has_non_null_version = True
                
                if has_non_null_version:
                    models_with_version_info[model_id] = all_model_dependencies[model_id]
                    
    except FileNotFoundError:
        print(f"Warning: Could not find file {json_file}")
    except json.JSONDecodeError:
        print(f"Warning: Error parsing JSON from {json_file}")
    except Exception as e:
        print(f"Warning: Unexpected error processing {json_file}: {str(e)}")

print("\nAll models and their dependencies across all files:")
for model_id, deps in all_model_dependencies.items():
    print(f"\nModel: {model_id}")
    for lib, version in deps:
        version_str = version if version is not None else "null"
        print(f"  {lib}: {version_str}")

print("\nModels with non-null version dependencies across all files:")
for model_id, deps in models_with_version_info.items():
    print(f"\nModel: {model_id}")
    for lib, version in deps:
        version_str = version if version is not None else "null"
        print(f"  {lib}: {version_str}")






All models and their dependencies across all files:

Model: deepset/roberta-base-squad2
  haystack-ai: null
  transformers: null

Model: distilbert/distilbert-base-cased-distilled-squad
  transformers: null

Model: sjrhuschlee/flan-t5-large-squad2
  transformers: null
  torch: null
  peft: null

Model: google-bert/bert-large-uncased-whole-word-masking-finetuned-squad
  torch: null

Model: deepset/bert-large-uncased-whole-word-masking-squad2
  haystack-ai: null
  transformers: null

Model: deepset/minilm-uncased-squad2
  haystack-ai: null
  transformers: null

Model: distilbert/distilbert-base-uncased-distilled-squad
  transformers: null

Model: google-bert/bert-large-cased-whole-word-masking-finetuned-squad
  torch: null

Model: csarron/mobilebert-uncased-squad-v2
  transformers: null

Model: SmallDoge/Doge-160M-Instruct
  transformers: null
  trl: null

Model: deepset/bert-base-cased-squad2
  haystack-ai: null
  transformers: null

Model: deepset/roberta-large-squad2
  transformers: 

In [1]:
# Code Block 1: Praise2112/ModernBERT-base-squad2-v0.2
!pip install transformers==4.48.0 torch==2.5.1 datasets==2.20.0 tokenizers==0.21.0


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==4.48.0
  Using cached transformers-4.48.0-py3-none-any.whl.metadata (44 kB)
Collecting torch==2.5.1
  Using cached torch-2.5.1-cp39-cp39-manylinux1_x86_64.whl.metadata (28 kB)
Collecting datasets==2.20.0
  Using cached datasets-2.20.0-py3-none-any.whl.metadata (19 kB)
Collecting tokenizers==0.21.0
  Using cached tokenizers-0.21.0-cp39-abi3-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (6.7 kB)
Collecting huggingface-hub<1.0,>=0.24.0 (from transformers==4.48.0)
  Downloading huggingface_hub-0.29.3-py3-none-any.whl.metadata (13 kB)
Collecting nvidia-cuda-nvrtc-cu12==12.4.127 (from torch==2.5.1)
  Using cached nvidia_cuda_nvrtc_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)
Collecting nvidia-cuda-runtime-cu12==12.4.127 (from torch==2.5.1)
  Using cached nvidia_cuda_runtime_cu12-12.4.127-py3-none-manylinux2014_x86_64.whl.metadata (1.5 kB)
Collecting nvidia-cud

In [1]:
from transformers import AutoModelForQuestionAnswering, AutoTokenizer

model_name = "Praise2112/ModernBERT-base-squad2-v0.2"
model = AutoModelForQuestionAnswering.from_pretrained(model_name, trust_remote_code=True)
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)

question = "What is dependency conflict?"
context = "Dependency conflicts occur when different packages require different versions of the same dependency."
inputs = tokenizer(question, context, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


modelling.py:   0%|          | 0.00/4.97k [00:00<?, ?B/s]

A new version of the following files was downloaded from https://huggingface.co/Praise2112/ModernBERT-base-squad2-v0.2:
- modelling.py
. Make sure to double-check they do not contain any added malicious code. To avoid downloading new versions of the code file, you can pin a revision.


RuntimeError: Failed to import transformers.models.modernbert.modeling_modernbert because of the following error (look up to see its traceback):
operator torchvision::nms does not exist

In [2]:
!pip uninstall -y torch torchvision torchaudio xformers aiofiles markupsafe urllib3 gradio
!pip install torch==2.2.0
!pip install torchvision==0.17.0
!pip install facenet-pytorch==2.6.0
!pip install gradio==4.44.1 aiofiles==23.1.0 markupsafe==2.1.1 urllib3==2.0.4

Found existing installation: torch 2.5.1
Uninstalling torch-2.5.1:
  Successfully uninstalled torch-2.5.1
Found existing installation: torchvision 0.21.0+cpu
Uninstalling torchvision-0.21.0+cpu:
  Successfully uninstalled torchvision-0.21.0+cpu
Found existing installation: torchaudio 2.5.0
Uninstalling torchaudio-2.5.0:
  Successfully uninstalled torchaudio-2.5.0
Found existing installation: xformers 0.0.20
Uninstalling xformers-0.0.20:
  Successfully uninstalled xformers-0.0.20
Found existing installation: aiofiles 24.1.0
Uninstalling aiofiles-24.1.0:
  Successfully uninstalled aiofiles-24.1.0
Found existing installation: MarkupSafe 3.0.2
Uninstalling MarkupSafe-3.0.2:
  Successfully uninstalled MarkupSafe-3.0.2
Found existing installation: urllib3 1.26.18
Uninstalling urllib3-1.26.18:
  Successfully uninstalled urllib3-1.26.18
Found existing installation: gradio 4.44.1
Uninstalling gradio-4.44.1:
  Successfully uninstalled gradio-4.44.1
Defaulting to user installation because normal 

In [1]:
from transformers import AutoModelForQuestionAnswering, AutoTokenizer

model_name = "Praise2112/ModernBERT-base-squad2-v0.2"
model = AutoModelForQuestionAnswering.from_pretrained(model_name, trust_remote_code=True)
tokenizer = AutoTokenizer.from_pretrained(model_name, trust_remote_code=True)

question = "What is dependency conflict?"
context = "Dependency conflicts occur when different packages require different versions of the same dependency."
inputs = tokenizer(question, context, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


2025-03-23 23:07:37.416815: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2025-03-23 23:07:37.921221: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:477] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
E0000 00:00:1742771258.108561   12686 cuda_dnn.cc:8310] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
E0000 00:00:1742771258.164793   12686 cuda_blas.cc:1418] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
2025-03-23 23:07:38.659088: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instr

model.safetensors:   0%|          | 0.00/598M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/21.1k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/3.58M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/694 [00:00<?, ?B/s]

QuestionAnsweringModelOutput(loss=None, start_logits=tensor([[ 9.7704, -0.7821, -4.7557,  3.2676, -4.0456,  3.1307,  4.5291,  9.4809,
          5.5877,  5.9925, 10.8607, 11.0336,  8.9084,  9.2726, 10.1642,  8.9332,
          4.6125,  8.3634,  7.5077,  7.6692,  6.9890,  2.9429]],
       grad_fn=<CloneBackward0>), end_logits=tensor([[ 9.1559, -0.5290, -0.2660,  1.9820, -1.3602,  3.3938,  4.8155,  6.6853,
          6.7588,  5.6995,  2.7776,  2.5640,  5.8419,  5.5150,  5.5985,  9.5415,
          5.1540,  5.0208,  8.4263, 12.6687, 11.1534,  0.6344]],
       grad_fn=<CloneBackward0>), hidden_states=None, attentions=None)


# electra_large_discriminator_squad2_512

In [10]:
!pip install transformers==2.11.0 torch==1.5.0 tensorflow==2.2.0

from transformers import AutoModelForQuestionAnswering, AutoTokenizer

model_name = "ahotrod/electra_large_discriminator_squad2_512"
model = AutoModelForQuestionAnswering.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

question = "Explain version conflicts in dependency management."
context = "Version conflicts can cause errors during package installation or runtime execution."
inputs = tokenizer(question, context, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==2.11.0
  Downloading transformers-2.11.0-py3-none-any.whl.metadata (45 kB)
[31mERROR: Could not find a version that satisfies the requirement torch==1.5.0 (from versions: 1.7.1, 1.8.0, 1.8.1, 1.9.0, 1.9.1, 1.10.0, 1.10.1, 1.10.2, 1.11.0, 1.12.0, 1.12.1, 1.13.0, 1.13.1, 2.0.0, 2.0.1, 2.1.0, 2.1.1, 2.1.2, 2.2.0, 2.2.1, 2.2.2, 2.3.0, 2.3.1, 2.4.0, 2.4.1, 2.5.0, 2.5.1, 2.6.0)[0m[31m
[0m[31mERROR: No matching distribution found for torch==1.5.0[0m[31m
[0m

config.json:   0%|          | 0.00/475 [00:00<?, ?B/s]

Unexpected exception formatting exception. Falling back to standard exception


Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/transformers/utils/import_utils.py", line 1126, in _get_module
    # Parse it and check the field "sagemaker_distributed_dataparallel_enabled".
  File "/usr/lib64/python3.9/importlib/__init__.py", line 127, in import_module
    return _bootstrap._gcd_import(name[level:], package, level)
  File "<frozen importlib._bootstrap>", line 1030, in _gcd_import
  File "<frozen importlib._bootstrap>", line 1007, in _find_and_load
  File "<frozen importlib._bootstrap>", line 984, in _find_and_load_unlocked
ModuleNotFoundError: No module named 'transformers.models.ernie_m.configuration_ernie_m'

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/IPython/core/interactiveshell.py", line 3550, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "/tmp/ipykernel_13607/713093529.py"

In [4]:
!pip uninstall -y torch 
!pip install transformers==2.11.0 torch==1.7.1 tensorflow==2.5.0

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==2.11.0
  Using cached transformers-2.11.0-py3-none-any.whl (674 kB)
Collecting torch==1.7.1
  Using cached torch-1.7.1-cp39-cp39-manylinux1_x86_64.whl (776.8 MB)
Collecting tensorflow==2.5.0
  Downloading tensorflow-2.5.0-cp39-cp39-manylinux2010_x86_64.whl (454.4 MB)
     |████████████████████████████████| 454.4 MB 16 kB/s       

In [5]:
from transformers import AutoModelForQuestionAnswering, AutoTokenizer

model_name = "ahotrod/electra_large_discriminator_squad2_512"
model = AutoModelForQuestionAnswering.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

question = "Explain version conflicts in dependency management."
context = "Version conflicts can cause errors during package installation or runtime execution."
inputs = tokenizer(question, context, return_tensors="pt")
outputs = model(**inputs)
print(outputs)

Downloading:   0%|          | 0.00/475 [00:00<?, ?B/s]

RuntimeError: Failed to import transformers.models.lxmert.configuration_lxmert because of the following error (look up to see its traceback):
No module named 'transformers.models.lxmert.configuration_lxmert'

In [11]:
# Code Block 3: bigwiz83/sapbert-from-pubmedbert-squad2
!pip install transformers==4.7.0 torch==1.8.0 datasets==1.4.1 tokenizers==0.10.2

from transformers import AutoModelForQuestionAnswering, AutoTokenizer

model_name = "bigwiz83/sapbert-from-pubmedbert-squad2"
model = AutoModelForQuestionAnswering.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

question = "What issues arise from dependency conflicts?"
context = "When multiple libraries require conflicting versions, errors are likely to happen."
inputs = tokenizer(question, context, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==4.7.0
  Downloading transformers-4.7.0-py3-none-any.whl.metadata (48 kB)
Collecting torch==1.8.0
  Using cached torch-1.8.0-cp39-cp39-manylinux1_x86_64.whl.metadata (23 kB)
Collecting datasets==1.4.1
  Downloading datasets-1.4.1-py3-none-any.whl.metadata (8.7 kB)
Collecting tokenizers==0.10.2
  Downloading tokenizers-0.10.2-cp39-cp39-manylinux2010_x86_64.whl.metadata (5.8 kB)
Collecting huggingface-hub==0.0.8 (from transformers==4.7.0)
  Downloading huggingface_hub-0.0.8-py3-none-any.whl.metadata (8.7 kB)
Collecting sacremoses (from transformers==4.7.0)
  Downloading sacremoses-0.1.1-py3-none-any.whl.metadata (8.3 kB)
Collecting tqdm>=4.27 (from transformers==4.7.0)
  Downloading tqdm-4.49.0-py2.py3-none-any.whl.metadata (55 kB)
INFO: pip is looking at multiple versions of datasets to determine which version is compatible with other requirements. This could take a while.
[31mERROR: C

config.json:   0%|          | 0.00/642 [00:00<?, ?B/s]

Unexpected exception formatting exception. Falling back to standard exception


Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/transformers/utils/import_utils.py", line 1126, in _get_module
    # Parse it and check the field "sagemaker_distributed_dataparallel_enabled".
  File "/usr/lib64/python3.9/importlib/__init__.py", line 127, in import_module
    return _bootstrap._gcd_import(name[level:], package, level)
  File "<frozen importlib._bootstrap>", line 1030, in _gcd_import
  File "<frozen importlib._bootstrap>", line 1007, in _find_and_load
  File "<frozen importlib._bootstrap>", line 984, in _find_and_load_unlocked
ModuleNotFoundError: No module named 'transformers.models.ernie_m.configuration_ernie_m'

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/IPython/core/interactiveshell.py", line 3550, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "/tmp/ipykernel_13607/328999849.py"

In [2]:
!pip uninstall -y transformers datasets huggingface-hub tokenizers
!pip install transformers==4.7.0
!pip install datasets==1.6.0
!pip install tokenizers==0.10.2
!pip install huggingface-hub==0.0.8

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Found existing installation: transformers 4.48.0
Uninstalling transformers-4.48.0:
  Successfully uninstalled transformers-4.48.0
Found existing installation: datasets 2.20.0
Uninstalling datasets-2.20.0:
  Successfully uninstalled datasets-2.20.0
Found existing installation: huggingface-hub 0.29.3
Uninstalling huggingface-hub-0.29.3:
  Successfully uninstalled huggingface-hub-0.29.3
Found existing installation: tokenizers 0.21.0
Uninstalling tokenizers-0.21.0:
  Successfully uninstalled tokenizers-0.21.0


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==4.7.0
  Using cached transformers-4.7.0-py3-none-any.whl.metadata (48 kB)
Collecting huggingface-hub==0.0.8 (from transformers==4.7.0)
  Using cached huggingface_hub-0.0.8-py3-none-any.whl.metadata (8.7 kB)
Collecting tokenizers<0.11,>=0.10.1 (from transformers==4.7.0)
  Using cached tokenizers-0.10.3-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl.metadata (5.8 kB)
Downloading transformers-4.7.0-py3-none-any.whl (2.5 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m2.5/2.5 MB[0m [31m46.4 MB/s[0m eta [36m0:00:00[0m
[?25hDownloading huggingface_hub-0.0.8-py3-none-any.whl (34 kB)
Using cached tokenizers-0.10.3-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (3.3 MB)
Installing collected packages: tokenizers, huggingface-hub, transformers
[31mERROR: pip's dependency res

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Defaulting to user installation because normal site-packages is not writeable
Collecting datasets==1.6.0
  Downloading datasets-1.6.0-py3-none-any.whl.metadata (8.9 kB)
Collecting tqdm<4.50.0,>=4.27 (from datasets==1.6.0)
  Using cached tqdm-4.49.0-py2.py3-none-any.whl.metadata (55 kB)
Downloading datasets-1.6.0-py3-none-any.whl (202 kB)
Downloading tqdm-4.49.0-py2.py3-none-any.whl (69 kB)
Installing collected packages: tqdm, datasets
  Attempting uninstall: tqdm
    Found existing installation: tqdm 4.66.5
    Uninstalling tqdm-4.66.5:
      Successfully uninstalled tqdm-4.66.5
[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.
evaluate 0.4.3 requires datasets>=2.0.0, but you have datasets 1.6.0 which is incompatible.
evaluate 0.4.3 requires huggingface-hub>=0.7.0, but you have huggingface-hub 0.0.8 which is incompatible.
evaluate 0.4.3 requires tqdm>=4.62.1

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Defaulting to user installation because normal site-packages is not writeable
Collecting tokenizers==0.10.2
  Using cached tokenizers-0.10.2-cp39-cp39-manylinux2010_x86_64.whl.metadata (5.8 kB)
Downloading tokenizers-0.10.2-cp39-cp39-manylinux2010_x86_64.whl (3.3 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m3.3/3.3 MB[0m [31m27.3 MB/s[0m eta [36m0:00:00[0m
[?25hInstalling collected packages: tokenizers
  Attempting uninstall: tokenizers
    Found existing installation: tokenizers 0.10.3
    Uninstalling tokenizers-0.10.3:
      Successfully uninstalled tokenizers-0.10.3
Successfully installed tokenizers-0.10.2


huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Defaulting to user installation because normal site-packages is not writeable


In [1]:
from transformers import AutoModelForQuestionAnswering, AutoTokenizer

model_name = "bigwiz83/sapbert-from-pubmedbert-squad2"
model = AutoModelForQuestionAnswering.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

question = "What issues arise from dependency conflicts?"
context = "When multiple libraries require conflicting versions, errors are likely to happen."
inputs = tokenizer(question, context, return_tensors="pt")
outputs = model(**inputs)
print(outputs)

HBox(children=(FloatProgress(value=0.0, description='Downloading', max=642.0, style=ProgressStyle(description_…




HBox(children=(FloatProgress(value=0.0, description='Downloading', max=435660911.0, style=ProgressStyle(descri…




HBox(children=(FloatProgress(value=0.0, description='Downloading', max=226150.0, style=ProgressStyle(descripti…




HBox(children=(FloatProgress(value=0.0, description='Downloading', max=460875.0, style=ProgressStyle(descripti…




HBox(children=(FloatProgress(value=0.0, description='Downloading', max=112.0, style=ProgressStyle(description_…




HBox(children=(FloatProgress(value=0.0, description='Downloading', max=365.0, style=ProgressStyle(description_…


QuestionAnsweringModelOutput(loss=None, start_logits=tensor([[ 1.1368, -4.9146, -5.2487, -7.3861, -7.6255, -5.4474, -7.0285, -8.2898,
         -7.5452,  0.1335,  0.8179, -0.4820, -2.7206, -0.5917, -0.9558, -0.1014,
          6.7624, -2.4672, -0.1479, -4.4067, -1.0293, -0.7967, -4.7433]],
       grad_fn=<CloneBackward0>), end_logits=tensor([[ 1.8309, -5.8596, -4.3662, -8.0650, -8.4170, -6.2748, -6.0801, -7.8794,
         -6.3227, -6.1576, -3.7363, -0.5591, -4.0226, -2.5224,  1.2005, -0.4061,
          5.9079, -1.4456,  2.0518, -2.9552,  5.7826,  6.1044, -2.8787]],
       grad_fn=<CloneBackward0>), hidden_states=None, attentions=None)


In [13]:
# Code Block 4: papluca/xlm-roberta-base-language-detection
!pip install transformers==4.12.5 torch==1.10.0 datasets==1.15.1 tokenizers==0.10.3

from transformers import AutoModelForSequenceClassification, AutoTokenizer

model_name = "papluca/xlm-roberta-base-language-detection"
model = AutoModelForSequenceClassification.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

text = "This is a test sentence."
inputs = tokenizer(text, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==4.12.5
  Using cached transformers-4.12.5-py3-none-any.whl.metadata (56 kB)
Collecting torch==1.10.0
  Downloading torch-1.10.0-cp39-cp39-manylinux1_x86_64.whl.metadata (24 kB)
Collecting datasets==1.15.1
  Downloading datasets-1.15.1-py3-none-any.whl.metadata (19 kB)
Collecting tokenizers==0.10.3
  Downloading tokenizers-0.10.3-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl.metadata (5.8 kB)
Collecting sacremoses (from transformers==4.12.5)
  Using cached sacremoses-0.1.1-py3-none-any.whl.metadata (8.3 kB)
Downloading transformers-4.12.5-py3-none-any.whl (3.1 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m3.1/3.1 MB[0m [31m28.6 MB/s[0m eta [36m0:00:00[0m
[?25hDownloading torch-1.10.0-cp39-cp39-manylinux1_x86_64.whl (881.9 MB)
[2K   [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m881.9/881.9 MB[0m [31m

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/transformers/utils/import_utils.py", line 1126, in _get_module
  File "/usr/lib64/python3.9/importlib/__init__.py", line 127, in import_module
    return _bootstrap._gcd_import(name[level:], package, level)
  File "<frozen importlib._bootstrap>", line 1030, in _gcd_import
  File "<frozen importlib._bootstrap>", line 1007, in _find_and_load
  File "<frozen importlib._bootstrap>", line 984, in _find_and_load_unlocked
ModuleNotFoundError: No module named 'transformers.models.ernie_m.configuration_ernie_m'

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/IPython/core/interactiveshell.py", line 3550, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "/tmp/ipykernel_13607/1299212770.py", line 7, in <module>
    model = AutoModelForSequenceClassification.from_pretra

In [2]:
!pip uninstall -y evaluate facenet-pytorch peft torchaudio torchvision xformers 
!pip install transformers==4.12.5 torch==1.10.0 datasets==1.15.1 tokenizers==0.10.3



huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Found existing installation: evaluate 0.4.3
Uninstalling evaluate-0.4.3:
  Successfully uninstalled evaluate-0.4.3
[0mFound existing installation: peft 0.9.0
Uninstalling peft-0.9.0:
  Successfully uninstalled peft-0.9.0
[0mFound existing installation: torchvision 0.16.0
Uninstalling torchvision-0.16.0:
  Successfully uninstalled torchvision-0.16.0
[0m

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==4.12.5
  Using cached transformers-4.12.5-py3-none-any.whl.metadata (56 kB)
Collecting torch==1.10.0
  Using cached torch-1.10.0-cp39-cp39-manylinux1_x86_64.whl.metadata (24 kB)
Collecting datasets==1.15.1
  Using cached datasets-1.15.1-py3-none-any.whl.metadata (19 kB)
Collecting tokenizers==0.10.3
  Using cached tokenizers-0.10.3-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl.metadata (5.8 kB)
Using cached transformers-4.12.5-py3-none-any.whl (3.1 MB)
Using cached torch-1.10.0-cp39-cp39-manylinux1_x86_64.whl (881.9 MB)
Using cached datasets-1.15.1-py3-none-any.whl (290 kB)
Using cached tokenizers-0.10.3-cp39-cp39-manylinux_2_5_x86_64.manylinux1_x86_64.manylinux_2_12_x86_64.manylinux2010_x86_64.whl (3.3 MB)
Installing collected packages: tokenizers, torch, transformers, datasets
  Attempting uninstall: tokenizers
    Found existing ins

In [1]:
from transformers import AutoModelForSequenceClassification, AutoTokenizer

model_name = "papluca/xlm-roberta-base-language-detection"
model = AutoModelForSequenceClassification.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

text = "This is a test sentence."
inputs = tokenizer(text, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


2025-03-24 01:08:56.393502: I tensorflow/core/util/port.cc:153] oneDNN custom operations are on. You may see slightly different numerical results due to floating-point round-off errors from different computation orders. To turn them off, set the environment variable `TF_ENABLE_ONEDNN_OPTS=0`.
2025-03-24 01:08:56.410381: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:477] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered
E0000 00:00:1742778536.430523   16690 cuda_dnn.cc:8310] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered
E0000 00:00:1742778536.436499   16690 cuda_blas.cc:1418] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered
2025-03-24 01:08:56.459213: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instr

Downloading:   0%|          | 0.00/1.38k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/1.04G [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/502 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/4.83M [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/8.66M [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/239 [00:00<?, ?B/s]

SequenceClassifierOutput(loss=None, logits=tensor([[-0.9294,  0.2665, -1.2123, -0.6366, -0.4184, -0.1648, -0.4607,  0.2771,
         -0.0657, -0.9682,  0.2180,  0.5397, -0.5279,  7.0440, -0.4062, -1.3086,
         -0.0667, -0.5790,  0.1626, -0.0940]], grad_fn=<AddmmBackward0>), hidden_states=None, attentions=None)


In [15]:
# Code Block 5: TieIncred/distilbert-base-uncased-finetuned-emotional
!pip install transformers==4.16.2 torch==2.1.0 datasets==2.9.0 tokenizers==0.14.1

from transformers import AutoModelForSequenceClassification, AutoTokenizer

model_name = "TieIncred/distilbert-base-uncased-finetuned-emotional"
model = AutoModelForSequenceClassification.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

text = "I feel great about dependency conflict experiments!"
inputs = tokenizer(text, return_tensors="pt")
outputs = model(**inputs)
print(outputs)


Defaulting to user installation because normal site-packages is not writeable
Collecting transformers==4.16.2
  Using cached transformers-4.16.2-py3-none-any.whl.metadata (61 kB)
Collecting torch==2.1.0
  Using cached torch-2.1.0-cp39-cp39-manylinux1_x86_64.whl.metadata (25 kB)
Collecting datasets==2.9.0
  Downloading datasets-2.9.0-py3-none-any.whl.metadata (19 kB)
Collecting tokenizers==0.14.1
  Downloading tokenizers-0.14.1-cp39-cp39-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (6.7 kB)
Collecting nvidia-cuda-nvrtc-cu12==12.1.105 (from torch==2.1.0)
  Using cached nvidia_cuda_nvrtc_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)
Collecting nvidia-cuda-runtime-cu12==12.1.105 (from torch==2.1.0)
  Using cached nvidia_cuda_runtime_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.5 kB)
Collecting nvidia-cuda-cupti-cu12==12.1.105 (from torch==2.1.0)
  Using cached nvidia_cuda_cupti_cu12-12.1.105-py3-none-manylinux1_x86_64.whl.metadata (1.6 kB)
Collecting

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/transformers/utils/import_utils.py", line 1126, in _get_module
  File "/usr/lib64/python3.9/importlib/__init__.py", line 127, in import_module
    return _bootstrap._gcd_import(name[level:], package, level)
  File "<frozen importlib._bootstrap>", line 1030, in _gcd_import
  File "<frozen importlib._bootstrap>", line 1007, in _find_and_load
  File "<frozen importlib._bootstrap>", line 984, in _find_and_load_unlocked
ModuleNotFoundError: No module named 'transformers.models.ernie_m.configuration_ernie_m'

The above exception was the direct cause of the following exception:

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/IPython/core/interactiveshell.py", line 3550, in run_code
    exec(code_obj, self.user_global_ns, self.user_ns)
  File "/tmp/ipykernel_13607/3975985701.py", line 7, in <module>
    model = AutoModelForSequenceClassification.from_pretra

In [7]:
!pip uninstall -y diffusers facenet-pytorch gradio gradio-client torchaudio torchvision xformers aiofiles markupsafe urllib3 huggingface-hub sentence-transformers
!pip install torch==2.1.0 transformers==4.16.2 datasets==2.9.0 tokenizers==0.14.1 torchvision==0.16.0 sentence-transformers==2.2.2

huggingface/tokenizers: The current process just got forked, after parallelism has already been used. Disabling parallelism to avoid deadlocks...
	- Avoid using `tokenizers` before the fork if possible
	- Explicitly set the environment variable TOKENIZERS_PARALLELISM=(true | false)
[0mFound existing installation: MarkupSafe 3.0.2
Uninstalling MarkupSafe-3.0.2:
[31mERROR: Exception:
Traceback (most recent call last):
  File "/usr/lib64/python3.9/shutil.py", line 825, in move
    os.rename(src, real_dst)
OSError: [Errno 18] Invalid cross-device link: '/usr/local/lib64/python3.9/site-packages/MarkupSafe-3.0.2.dist-info/' -> '/tmp/pip-uninstall-5wwwsd3c'

During handling of the above exception, another exception occurred:

Traceback (most recent call last):
  File "/home/ec2-user/.local/lib/python3.9/site-packages/pip/_internal/cli/base_command.py", line 106, in _run_wrapper
    status = _inner_run()
  File "/home/ec2-user/.local/lib/python3.9/site-packages/pip/_internal/cli/base_command

In [1]:
from transformers import AutoModelForSequenceClassification, AutoTokenizer

model_name = "TieIncred/distilbert-base-uncased-finetuned-emotional"
model = AutoModelForSequenceClassification.from_pretrained(model_name)
tokenizer = AutoTokenizer.from_pretrained(model_name)

text = "I feel great about dependency conflict experiments!"
inputs = tokenizer(text, return_tensors="pt")
outputs = model(**inputs)
print(outputs)

Downloading:   0%|          | 0.00/883 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/255M [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/333 [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/226k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/695k [00:00<?, ?B/s]

Downloading:   0%|          | 0.00/112 [00:00<?, ?B/s]

SequenceClassifierOutput(loss=None, logits=tensor([[-1.3230,  5.9586, -1.2204, -2.0150, -1.9393, -1.0871]],
       grad_fn=<AddmmBackward0>), hidden_states=None, attentions=None)
