In [1]:
# Install required packages if not already installed
%pip install --quiet transformers torch datasets pillow

# Verify installations
import transformers
import torch
import datasets

# Report the installed version of each core library with a single print call,
# one library per line.
print(
    f"Transformers version: {transformers.__version__}",
    f"PyTorch version: {torch.__version__}",
    f"Datasets version: {datasets.__version__}",
    sep="\n",
)

Note: you may need to restart the kernel to use updated packages.
Transformers version: 4.53.2
PyTorch version: 2.7.1+cpu
Datasets version: 4.0.0


In [2]:
from transformers import AutoTokenizer, AutoModelForSequenceClassification, pipeline
import torch

# Checkpoint used for the sentiment example.
model_name = "cardiffnlp/twitter-roberta-base-sentiment-latest"

# Instantiate the tokenizer and the sequence-classification model from that
# same checkpoint name.
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSequenceClassification.from_pretrained(model_name)

# Wrap the already-loaded model and tokenizer in a sentiment-analysis pipeline.
classifier = pipeline(
    task="sentiment-analysis",
    model=model,
    tokenizer=tokenizer,
)

# Example inputs to classify.
texts = [
    "I'm loving this update!",
    "This is trash, I'm disappointed.",
    "Not sure how I feel about the changes.",
]

# Run the pipeline once over the whole list instead of once per string. Given
# a list, it returns one dict (with 'label' and 'score' keys) per input, in
# input order, so no [0] unwrapping is needed.
predictions = classifier(texts)

# Print each input next to its predicted label and confidence score.
for text, result in zip(texts, predictions):
    print(f"Text: {text}")
    print(f"Sentiment: {result['label']}, Score: {result['score']:.4f}\n")


Some weights of the model checkpoint at cardiffnlp/twitter-roberta-base-sentiment-latest were not used when initializing RobertaForSequenceClassification: ['roberta.pooler.dense.bias', 'roberta.pooler.dense.weight']
- This IS expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing RobertaForSequenceClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Device set to use cpu


Text: I'm loving this update!
Sentiment: positive, Score: 0.9879

Text: This is trash, I'm disappointed.
Sentiment: negative, Score: 0.9461

Text: Not sure how I feel about the changes.
Sentiment: negative, Score: 0.5745



In [3]:
from transformers import pipeline
from PIL import Image
# Load an image-classification pipeline backed by a ViT checkpoint.
image_classifier = pipeline("image-classification", model="google/vit-base-patch16-224")

# Image.open() is lazy and keeps the underlying file handle open, so run the
# classification inside a `with` block that releases the handle on exit.
with Image.open("dog.png") as image:  # Use any local image path
    results = image_classifier(image)

# Each entry is a dict holding a 'label' and its 'score'.
for result in results:
    print(result)

Device set to use cpu


{'label': 'Egyptian cat', 'score': 0.8234645128250122}
{'label': 'tabby, tabby cat', 'score': 0.11641877889633179}
{'label': 'tiger cat', 'score': 0.053732335567474365}
{'label': 'lynx, catamount', 'score': 0.0012239273637533188}
{'label': 'Siamese cat, Siamese', 'score': 0.00013562229287344962}


In [4]:
from transformers import pipeline
 
# Build an automatic-speech-recognition pipeline on a wav2vec2 checkpoint.
speech_recognizer = pipeline(
    task="automatic-speech-recognition",
    model="facebook/wav2vec2-base-960h",
)

# Path of the recording to transcribe.
# NOTE(review): this was previously described as "must be a .wav file"; the
# pipeline documentation says path inputs are decoded with ffmpeg, so other
# formats should also work when ffmpeg is installed -- confirm.
audio_file = "harvard.wav"

# Transcribe the recording and show the recognised text.
result = speech_recognizer(audio_file)
print("Transcription:", result["text"])

Some weights of Wav2Vec2ForCTC were not initialized from the model checkpoint at facebook/wav2vec2-base-960h and are newly initialized: ['wav2vec2.masked_spec_embed']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.
Device set to use cpu


Transcription: THE STALE SMELL OF OLD BEER LINGERS IT TAKES HEAT TO BRING OUT THE ODOR A COLD DIP RESTORES HEALTH AND ZEST A SALT PICKLE TASTES FINE WITH HAM TAKOS AL PASTORE ARE MY FAVORITE A ZESTFUL FOOD IS THE HOT CROSS BUN


In [7]:
from transformers import AutoTokenizer, AutoModelForSequenceClassification
 
# Load the tokenizer and a BERT model with a 2-label classification head.
# The head is not part of the bert-base-uncased checkpoint, so it starts out
# newly initialized and needs training before its predictions mean anything.
tokenizer = AutoTokenizer.from_pretrained("bert-base-uncased")
model = AutoModelForSequenceClassification.from_pretrained("bert-base-uncased", num_labels=2)

# Example text
text = '''
This is a sample text for fine-tuning demonstration. This continues the sentence.
Now this is another sentence in a separate line.
'''

# Tokenize into PyTorch tensors. truncation=True caps the sequence at the
# tokenizer's maximum length, so swapping in a longer text cannot produce an
# input longer than the model accepts; the short sample above is unaffected.
inputs = tokenizer(text, return_tensors="pt", truncation=True)
print("Tokenized input:", inputs)

Some weights of BertForSequenceClassification were not initialized from the model checkpoint at bert-base-uncased and are newly initialized: ['classifier.bias', 'classifier.weight']
You should probably TRAIN this model on a down-stream task to be able to use it for predictions and inference.


Tokenized input: {'input_ids': tensor([[  101,  2023,  2003,  1037,  7099,  3793,  2005,  2986,  1011, 17372,
         10467,  1012,  2023,  4247,  1996,  6251,  1012,  2085,  2023,  2003,
          2178,  6251,  1999,  1037,  3584,  2240,  1012,   102]]), 'token_type_ids': tensor([[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
         0, 0, 0, 0]]), 'attention_mask': tensor([[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1]])}
