In [3]:

from transformers import BartTokenizer, BartForConditionalGeneration

# Load the tokenizer and seq2seq model for the 'facebook/bart-large-cnn' checkpoint.
tokenizer = BartTokenizer.from_pretrained('facebook/bart-large-cnn')
model = BartForConditionalGeneration.from_pretrained('facebook/bart-large-cnn')

# Passage to summarize.
text = """
Dr. A.P.J. Abdul Kalam, popularly known as the 'Missile Man of India', was a renowned aerospace scientist and the 11th President of India.
He played a pivotal role in India's Pokhran-II nuclear tests in 1998, which established India as a nuclear power.
Born in a modest family in Rameswaram, Tamil Nadu, Dr. Kalam rose through hard work, education, and integrity.
He was instrumental in the development of India’s missile and satellite programs during his tenure at DRDO and ISRO.
A beloved teacher and motivator, Dr. Kalam authored several inspirational books including 'Wings of Fire' and 'Ignited Minds'.
He dedicated his life to youth empowerment and nation-building, continuing to teach and inspire students until his last breath.
His humility, vision, and patriotism earned him immense respect across the world.
"""

# Encode the passage as a batch of one, clipping it to at most 1024 tokens.
inputs = tokenizer([text], max_length=1024, return_tensors='pt', truncation=True)

# Forward the whole encoding (input_ids AND attention_mask) to generate().
# Passing only input_ids leaves the model without an explicit mask, which is
# harmless for a single unpadded sequence but wrong as soon as inputs are
# padded or batched.
summary_ids = model.generate(
    **inputs,
    max_length=100,       # upper bound on the generated summary length (tokens)
    min_length=30,        # lower bound on the generated summary length (tokens)
    length_penalty=2.0,   # beam-score length exponent; values > 1 favour longer outputs
    num_beams=4,          # beam search width
    early_stopping=True   # stop once enough finished beam candidates exist
)

# Convert the first (only) generated sequence back to text, dropping special tokens.
summary = tokenizer.decode(summary_ids[0], skip_special_tokens=True)
print("Summary:", summary)




Summary: Dr. A.P.J. Abdul Kalam was a renowned aerospace scientist and the 11th President of India. He played a pivotal role in India's Pokhran-II nuclear tests in 1998, which established India as a nuclear power.


In [4]:
from transformers import T5Tokenizer, T5ForConditionalGeneration

# Load the tokenizer and seq2seq model for the "google/flan-t5-base" checkpoint.
# NOTE: this rebinds `tokenizer` and `model`, replacing any objects previously
# bound to those names in the kernel.
tokenizer = T5Tokenizer.from_pretrained("google/flan-t5-base")
model = T5ForConditionalGeneration.from_pretrained("google/flan-t5-base")

# Instruction-style input: the task ("Summarize:") is stated in the text itself.
prompt = """Summarize: Dr. A.P.J. Abdul Kalam, popularly known as the 'Missile Man of India', was a renowned aerospace scientist and the 11th President of India.
He played a pivotal role in India's Pokhran-II nuclear tests in 1998, which established India as a nuclear power.
Born in a modest family in Rameswaram, Tamil Nadu, Dr. Kalam rose through hard work, education, and integrity.
He was instrumental in the development of India’s missile and satellite programs during his tenure at DRDO and ISRO.
A beloved teacher and motivator, Dr. Kalam authored several inspirational books including 'Wings of Fire' and 'Ignited Minds'.
He dedicated his life to youth empowerment and nation-building, continuing to teach and inspire students until his last breath.
His humility, vision, and patriotism earned him immense respect across the world."""

# Encode the prompt with an explicit length guard so an over-long prompt is
# clipped instead of being passed through at full length.
# 512 is presumably this checkpoint's intended input length — TODO confirm
# against tokenizer.model_max_length.
inputs = tokenizer(prompt, return_tensors="pt", truncation=True, max_length=512)

# Beam-search decoding; the full encoding (input_ids + attention_mask) is forwarded.
outputs = model.generate(**inputs, max_length=100, num_beams=4, early_stopping=True)

# Convert the first (only) generated sequence back to text, dropping special tokens.
summary = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("Generated Summary:", summary)


You are using the default legacy behaviour of the <class 'transformers.models.t5.tokenization_t5.T5Tokenizer'>. This is expected, and simply means that the `legacy` (previous) behavior will be used so nothing changes for you. If you want to use the new behaviour, set `legacy=False`. This should only be set if you understand what it means, and thoroughly read the reason why this was added as explained in https://github.com/huggingface/transformers/pull/24565


Generated Summary: Dr. A.P.J. Abdul Kalam was born in Rameswaram, Tamil Nadu.
