In [None]:
# !pip install -U transformers[sentencepiece]
import transformers
from transformers import pipeline
import gc
import torch
from transformers import AutoTokenizer
from transformers import AutoModelForSequenceClassification
from torch.nn.functional import softmax

In [None]:
classifier=pipeline("zero-shot-classification", model="MoritzLaurer/mDeBERTa-v3-base-xnli-multilingual-nli-2mil7")
classifier(["I am crying because my friend cat died. But the twist is that I am the one who killed the cat and tbh i killed almost 80% of the cats. My goal is to make a cat-free world! I just want to hide my cruel face. So I just acted like I'm crying. I am in face very happy that the ugly cat and 80% of those ugly faces are now gone"],
           candidate_labels=[
               "Personal: Refers to a person's own things",
               "Emotional: Refers to expression of emotion",
               "Friendship: Refers to being friendly and being there for each other whenever required",
               "Murder: Refers to an action of killing someone/something",
               "Genocide: Refers to an action of killing some species in large groups",
               "Love: Refers to being loved/loving",
               "Future: Refers to an action that's going to happen"
           ])

Device set to use cuda:0


[{'sequence': "I am crying because my friend cat died. But the twist is that I am the one who killed the cat and tbh i killed almost 80% of the cats. My goal is to make a cat-free world! I just want to hide my cruel face. So I just acted like I'm crying. I am in face very happy that the ugly cat and 80% of those ugly faces are now gone",
  'labels': ['Murder: Refers to an action of killing someone/something',
   "Personal: Refers to a person's own things",
   'Genocide: Refers to an action of killing some species in large groups',
   'Emotional: Refers to expression of emotion',
   "Future: Refers to an action that's going to happen",
   'Love: Refers to being loved/loving',
   'Friendship: Refers to being friendly and being there for each other whenever required'],
  'scores': [0.7230494618415833,
   0.11240963637828827,
   0.09355559945106506,
   0.05854560062289238,
   0.011416277848184109,
   0.0007937590125948191,
   0.00022964751406107098]}]

In [None]:
# ?transformers.pipelines.ZeroShotClassificationPipeline

In [None]:
generator=pipeline("text-generation", model="Qwen/Qwen3-0.6B")
generator("The project we are going to work is", max_length=30, num_return_sequences=2)

Device set to use cuda:0
Truncation was not explicitly activated but `max_length` is provided a specific value, please use `truncation=True` to explicitly truncate examples to max length. Defaulting to 'longest_first' truncation strategy. If you encode pairs of sequences (GLUE-style) with the tokenizer you can select this strategy more precisely by providing a specific strategy to `truncation`.
Both `max_new_tokens` (=256) and `max_length`(=30) seem to have been set. `max_new_tokens` will take precedence. Please refer to the documentation for more information. (https://huggingface.co/docs/transformers/main/en/main_classes/text_generation)


[{'generated_text': "The project we are going to work is a big project. I need to write a response to the project manager that says that I have the following objectives: 1. Develop a comprehensive database of the project data. 2. Develop a system for analyzing and reporting the project data. 3. Develop a comprehensive plan for the project. 4. Develop a training program for the team members. 5. Monitor the progress of the project and evaluate its performance. 6. Ensure that all project documents are stored in a secure and accessible location. 7. Create a system for managing the project resources. 8. Develop a comprehensive and flexible framework for the project. 9. Create a report for the team members on the project's status and performance. 10. Develop a system for tracking the project's progress and ensuring its success. 11. Create a report for the project team on the project's progress and success. 12. Ensure that all project resources are fully utilized. 13. Create a system for the 

In [None]:
unmasker=pipeline("fill-mask", model="google-bert/bert-base-uncased")
unmasker("Osama bin laden bombed the [MASK] towers and is responsible for 9/11 attacks.", top_k=2)

Some weights of the model checkpoint at google-bert/bert-base-uncased were not used when initializing BertForMaskedLM: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'cls.seq_relationship.bias', 'cls.seq_relationship.weight']
- This IS expected if you are initializing BertForMaskedLM from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForMaskedLM from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Device set to use cuda:0


[{'score': 0.7213783264160156,
  'token': 5519,
  'token_str': 'twin',
  'sequence': 'osama bin laden bombed the twin towers and is responsible for 9 / 11 attacks.'},
 {'score': 0.0945662409067154,
  'token': 2048,
  'token_str': 'two',
  'sequence': 'osama bin laden bombed the two towers and is responsible for 9 / 11 attacks.'}]

In [None]:
recognizer=pipeline("ner", grouped_entities=True)
recognizer("My name is Harsha and I am working at Maheswari Pvt Ltd.")

No model was supplied, defaulted to dbmdz/bert-large-cased-finetuned-conll03-english and revision 4c53496 (https://huggingface.co/dbmdz/bert-large-cased-finetuned-conll03-english).
Using a pipeline without specifying a model name and revision in production is not recommended.
Some weights of the model checkpoint at dbmdz/bert-large-cased-finetuned-conll03-english were not used when initializing BertForTokenClassification: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
- This IS expected if you are initializing BertForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).
Device set to use cuda:0


[{'entity_group': 'PER',
  'score': np.float32(0.9951605),
  'word': 'Harsha',
  'start': 11,
  'end': 17},
 {'entity_group': 'ORG',
  'score': np.float32(0.9825239),
  'word': 'Maheswari Pvt Ltd',
  'start': 38,
  'end': 55}]

In [None]:
summarizer=pipeline("summarization")
summarizer(
    """
    The project we are going to work is about the development of the education sector in rural areas. The project is aimed at the development of the education sector in rural areas in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region. The project is about the development of the education sector in the region.\n\nI think that the project is about the development of the education sector in the region. So, I will proceed to work on this project.\n\nNow, I have to write the project description. The project description should start with the
    """
)

No model was supplied, defaulted to sshleifer/distilbart-cnn-12-6 and revision a4f8f3e (https://huggingface.co/sshleifer/distilbart-cnn-12-6).
Using a pipeline without specifying a model name and revision in production is not recommended.
Device set to use cuda:0


[{'summary_text': ' The project we are going to work is about the development of the education sector in rural areas in the region . The project is aimed at the development . of the . development of . the education . sector in the . region. The project description should start with the project description of the project .'}]

In [None]:
classifier=pipeline("text-generation", model="Qwen/Qwen2.5-7B-Instruct")
# ?transformers.pipelines.TextGenerationPipeline

The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


config.json:   0%|          | 0.00/663 [00:00<?, ?B/s]

model.safetensors.index.json: 0.00B [00:00, ?B/s]

Fetching 4 files:   0%|          | 0/4 [00:00<?, ?it/s]

model-00004-of-00004.safetensors:   0%|          | 0.00/3.56G [00:00<?, ?B/s]

model-00003-of-00004.safetensors:   0%|          | 0.00/3.86G [00:00<?, ?B/s]

model-00001-of-00004.safetensors:   0%|          | 0.00/3.95G [00:00<?, ?B/s]

model-00002-of-00004.safetensors:   0%|          | 0.00/3.86G [00:00<?, ?B/s]

Loading checkpoint shards:   0%|          | 0/4 [00:00<?, ?it/s]

generation_config.json:   0%|          | 0.00/243 [00:00<?, ?B/s]

tokenizer_config.json: 0.00B [00:00, ?B/s]

vocab.json: 0.00B [00:00, ?B/s]

merges.txt: 0.00B [00:00, ?B/s]

tokenizer.json: 0.00B [00:00, ?B/s]

Device set to use cuda:0


In [None]:
classifier("Classify sentiment as positive or negative. Output only the answer and no additional text: A good movie.", truncation=True, max_new_tokens=2)

[{'generated_text': 'Classify sentiment as positive or negative. Output only the answer and no additional text: A good movie. Positive\n\n'}]

In [None]:
gc.collect()
torch.cuda.empty_cache()

In [None]:
classifier=pipeline("sentiment-analysis")
classifier(["I've been waiting for a HuggingFace course my whole life.",
        "I hate this so much!"])

No model was supplied, defaulted to distilbert/distilbert-base-uncased-finetuned-sst-2-english and revision 714eb0f (https://huggingface.co/distilbert/distilbert-base-uncased-finetuned-sst-2-english).
Using a pipeline without specifying a model name and revision in production is not recommended.
The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


config.json:   0%|          | 0.00/629 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/268M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]

vocab.txt: 0.00B [00:00, ?B/s]

Device set to use cuda:0


[{'label': 'POSITIVE', 'score': 0.9598046541213989},
 {'label': 'NEGATIVE', 'score': 0.9994558691978455}]

In [None]:
model_name="distilbert/distilbert-base-uncased-finetuned-sst-2-english"
tokenizer=AutoTokenizer.from_pretrained(model_name)

In [None]:
tokenizer

DistilBertTokenizerFast(name_or_path='distilbert/distilbert-base-uncased-finetuned-sst-2-english', vocab_size=30522, model_max_length=512, is_fast=True, padding_side='right', truncation_side='right', special_tokens={'unk_token': '[UNK]', 'sep_token': '[SEP]', 'pad_token': '[PAD]', 'cls_token': '[CLS]', 'mask_token': '[MASK]'}, clean_up_tokenization_spaces=True, added_tokens_decoder={
	0: AddedToken("[PAD]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	100: AddedToken("[UNK]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	101: AddedToken("[CLS]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	102: AddedToken("[SEP]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
	103: AddedToken("[MASK]", rstrip=False, lstrip=False, single_word=False, normalized=False, special=True),
}
)

In [None]:
enc_inps=tokenizer(["I hate this so much!", "I like this so much, ya'know!"],
          truncation=True,
          padding=True,
          return_tensors="pt")
enc_inps

{'input_ids': tensor([[ 101, 1045, 5223, 2023, 2061, 2172,  999,  102,    0,    0,    0,    0],
        [ 101, 1045, 2066, 2023, 2061, 2172, 1010, 8038, 1005, 2113,  999,  102]]), 'attention_mask': tensor([[1, 1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0],
        [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]])}

In [None]:
model=AutoModelForSequenceClassification.from_pretrained(model_name)

In [None]:
logits=model(**enc_inps).logits
prob=softmax(logits, dim=-1)
display(prob)

tensor([[9.9946e-01, 5.4418e-04],
        [1.5020e-04, 9.9985e-01]], grad_fn=<SoftmaxBackward0>)

In [None]:
model.config.id2label

{0: 'NEGATIVE', 1: 'POSITIVE'}

In [None]:
from transformers import AutoTokenizer, AutoModelForCausalLM
from torch.nn.functional import softmax
import torch

In [None]:
model_name="openai-community/gpt2"

In [None]:
tokenizer=AutoTokenizer.from_pretrained(model_name)

The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


In [None]:
model=AutoModelForCausalLM.from_pretrained(model_name).to("cuda")

In [None]:
tokenizer.pad_token="<PAD>"
enc_inp=tokenizer(["Today, we are going to",
           "The project we are going to do is"],
          truncation=True,
          padding=True,
          return_tensors="pt",
          padding_side="left")
input_ids=enc_inp.input_ids.to("cuda")
attn_mask=enc_inp.attention_mask
input_ids

tensor([[50256, 50256,  8888,    11,   356,   389,  1016,   284],
        [  464,  1628,   356,   389,  1016,   284,   466,   318]],
       device='cuda:0')

In [None]:
for _ in range(100):
  logits=model(input_ids, attention_mask=attn_mask).logits[:,-1,:]
  # display(logits.size())
  prob=softmax(logits, dim=-1)
  # display(prob)
  next_token_id=torch.multinomial(prob, num_samples=1)
  input_ids=torch.cat([input_ids, next_token_id], dim=-1)
input_ids.size()

torch.Size([2, 108])

In [None]:
input_ids[0]
tokenizer.decode(input_ids[0],
                  skip_special_tokens=True)

'Today, we are going to, and on and, we today, or otherwise, we, our sometimes thus the Over Sometimes Everyday, we often, they, We now, the And Whenever, and, today of This Day on We, We We\n But A a Of And In on, Today, Often A Public, Today Now Sometimes Now So This, Today Every And, On Often By Often In Certainly Whether Found Day Today In This On the I, While On It So, people The Right Recent, And Normally, Today'

In [None]:
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM
from torch.nn.functional import softmax

In [None]:
model_name="Qwen/Qwen3-0.6B"
tokenizer=AutoTokenizer.from_pretrained(model_name)

tokenizer_config.json: 0.00B [00:00, ?B/s]

vocab.json: 0.00B [00:00, ?B/s]

merges.txt: 0.00B [00:00, ?B/s]

tokenizer.json:   0%|          | 0.00/11.4M [00:00<?, ?B/s]

In [None]:
model=AutoModelForCausalLM.from_pretrained(model_name).to("cuda")

In [None]:
tokenizer.padding_side="left"
enc_inp=tokenizer(["Today, we are going to",
           "The project we are going to do is"],
          truncation=True,
          padding=True,
          return_tensors="pt").to("cuda")

In [None]:
inp_ids=enc_inp.input_ids
attn_mask=enc_inp.attention_mask

In [None]:
for _ in range(25):
  logits=model(input_ids=inp_ids,
        attention_mask=attn_mask).logits[:,-1,:]
  prob=softmax(logits, dim=-1)
  next_tkn_id=torch.multinomial(prob,
                                num_samples=1)
  inp_ids=torch.cat([inp_ids, next_tkn_id], dim=-1)

In [None]:
tokenizer.decode(inp_ids[0],
                 skip_special_tokens=True)

'Today, we are going to learn visit become finding watching yet islet atkeyword outline          ! today can tryorm for that we  Kim should Falling the'