In [1]:
# Check if the model is correctly loaded
from transformers import DistilBertForSequenceClassification, DistilBertTokenizer

In [2]:
# Check if the model is correctly loaded
from transformers import DistilBertForSequenceClassification, DistilBertTokenizer

model_name = 'distilbert-base-uncased-finetuned-sst-2-english'
model = DistilBertForSequenceClassification.from_pretrained(model_name)
tokenizer = DistilBertTokenizer.from_pretrained(model_name)

# Display model and tokenizer details
print(model.config)
print(tokenizer)

DistilBertConfig {
  "_name_or_path": "distilbert-base-uncased-finetuned-sst-2-english",
  "activation": "gelu",
  "architectures": [
    "DistilBertForSequenceClassification"
  ],
  "attention_dropout": 0.1,
  "dim": 768,
  "dropout": 0.1,
  "finetuning_task": "sst-2",
  "hidden_dim": 3072,
  "id2label": {
    "0": "NEGATIVE",
    "1": "POSITIVE"
  },
  "initializer_range": 0.02,
  "label2id": {
    "NEGATIVE": 0,
    "POSITIVE": 1
  },
  "max_position_embeddings": 512,
  "model_type": "distilbert",
  "n_heads": 12,
  "n_layers": 6,
  "output_past": true,
  "pad_token_id": 0,
  "qa_dropout": 0.1,
  "seq_classif_dropout": 0.2,
  "sinusoidal_pos_embds": false,
  "tie_weights_": true,
  "transformers_version": "4.42.4",
  "vocab_size": 30522
}

DistilBertTokenizer(name_or_path='distilbert-base-uncased-finetuned-sst-2-english', vocab_size=30522, model_max_length=512, is_fast=False, padding_side='right', truncation_side='right', special_tokens={'unk_token': '[UNK]', 'sep_token': '[SEP]', '

In [3]:
# Verify Environment and Library Versions

import transformers

# Print the version of transformers library
print(transformers.__version__)

4.42.4


In [5]:
from transformers import pipeline, DistilBertForSequenceClassification, DistilBertTokenizer

In [6]:
# Load the pre-trained model and tokenizer
model_name = 'distilbert-base-uncased-finetuned-sst-2-english'
model = DistilBertForSequenceClassification.from_pretrained(model_name)
tokenizer = DistilBertTokenizer.from_pretrained(model_name)

In [7]:
# Specify the task and the pre-trained model
pipe = pipeline(task='sentiment-analysis', model=model, tokenizer=tokenizer)

Hardware accelerator e.g. GPU is available in the environment, but no `device` argument is passed to the `Pipeline` object. Model will be on CPU.


In [8]:
# Example text data
data = [
    "I love this movie, it was fantastic!",
    "The film was boring and too long.",
    "An excellent performance by the lead actor.",
    "Not my cup of tea, I didn't enjoy it."
]


In [9]:
# Make predictions
preds = pipe(data)

In [10]:
# Inspect the predictions
for text, pred in zip(data, preds):
    print(f'Text: {text}')
    print(f'Prediction: {pred}\n')

Text: I love this movie, it was fantastic!
Prediction: {'label': 'POSITIVE', 'score': 0.9998763799667358}

Text: The film was boring and too long.
Prediction: {'label': 'NEGATIVE', 'score': 0.9997709393501282}

Text: An excellent performance by the lead actor.
Prediction: {'label': 'POSITIVE', 'score': 0.9998691082000732}

Text: Not my cup of tea, I didn't enjoy it.
Prediction: {'label': 'NEGATIVE', 'score': 0.9989538192749023}

