# Sentiment analysis

In [17]:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-classification", model="tabularisai/multilingual-sentiment-analysis")

Device set to use cpu


In [18]:
text1 = "I like cricket"
text2 = "I hate cricket"

In [19]:
classification1 = pipe(text1)
classification2 = pipe(text2)
print(classification1)
print(classification2)

[{'label': 'Positive', 'score': 0.5761851668357849}]
[{'label': 'Negative', 'score': 0.6629091501235962}]


# Zero - Shot classifier

In [20]:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("zero-shot-classification", model="MoritzLaurer/bge-m3-zeroshot-v2.0")

Device set to use cpu


In [26]:
text = "I like cricket"
classes = ["Education", "Sports", "business"]

In [27]:
classification = pipe(text, classes)
print(classification)

{'sequence': 'I like cricket', 'labels': ['Sports', 'Education', 'business'], 'scores': [0.9975178837776184, 0.001547313411720097, 0.0009348341263830662]}


# Text generation

In [35]:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("text-generation", model="distilgpt2")

config.json:   0%|          | 0.00/762 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/353M [00:00<?, ?B/s]

generation_config.json:   0%|          | 0.00/124 [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/26.0 [00:00<?, ?B/s]

vocab.json:   0%|          | 0.00/1.04M [00:00<?, ?B/s]

merges.txt:   0%|          | 0.00/456k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/1.36M [00:00<?, ?B/s]

Device set to use cpu


In [38]:
text = "What is python"

In [42]:
genr = pipe(text, max_new_tokens=30)
print(genr)

Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


[{'generated_text': 'What is python.py with Python 3.8.5 and later.'}]


# NER

In [50]:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("ner", grouped_entities=True)

No model was supplied, defaulted to dbmdz/bert-large-cased-finetuned-conll03-english and revision 4c53496 (https://huggingface.co/dbmdz/bert-large-cased-finetuned-conll03-english).
Using a pipeline without specifying a model name and revision in production is not recommended.
Some weights of the model checkpoint at dbmdz/bert-large-cased-finetuned-conll03-english were not used when initializing BertForTokenClassification: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
- This IS expected if you are initializing BertForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Device set to use cpu


In [56]:
text = "My name is Syed Najiullah and I work for PureLogics."

In [58]:
ner = pipe(text)
print(ner)

[{'entity_group': 'PER', 'score': np.float32(0.9989508), 'word': 'Syed Najiullah', 'start': 11, 'end': 25}, {'entity_group': 'ORG', 'score': np.float32(0.9967527), 'word': 'PureLogics', 'start': 41, 'end': 51}]


# Question Answering

In [59]:
# Use a pipeline as a high-level helper
from transformers import pipeline

pipe = pipeline("question-answering")

No model was supplied, defaulted to distilbert/distilbert-base-cased-distilled-squad and revision 564e9b5 (https://huggingface.co/distilbert/distilbert-base-cased-distilled-squad).
Using a pipeline without specifying a model name and revision in production is not recommended.


config.json:   0%|          | 0.00/473 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/261M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/49.0 [00:00<?, ?B/s]

vocab.txt: 0.00B [00:00, ?B/s]

tokenizer.json: 0.00B [00:00, ?B/s]

Device set to use cpu


In [60]:
pipe(question="What is my name?", context="My name is Syed Najiullah and I work for PureLogics.")

{'score': 0.9920346047674684,
 'start': 11,
 'end': 25,
 'answer': 'Syed Najiullah'}