In [None]:
import torch

# Query CUDA support once, then report it; later cells place the model on the GPU.
cuda_ready = torch.cuda.is_available()
print("GPU Available:", cuda_ready)

# Model and Tokenizer Initialization

In [None]:
from transformers import AutoModelForSeq2SeqLM, AutoTokenizer
import torch

# Checkpoint id; it is loaded through the sequence-to-sequence auto class below.
model_name = "google/flan-t5-small"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSeq2SeqLM.from_pretrained(model_name)

# Prefer the GPU, but fall back to the CPU so that loading the model does not
# raise on a machine without CUDA.
device = "cuda" if torch.cuda.is_available() else "cpu"
model = model.to(device)


The first part of the notebook loads the Large Language Model and its tokenizer using the Hugging Face `transformers` library.

# Text Generation Examples


This section demonstrates how to format prompts and configure the model's generation parameters.

In [None]:
# Send one prompt to the currently loaded model and print the decoded answer.
prompt = "Explain gravity in one sentence"
# Tokenize to PyTorch tensors and place them on whatever device the model
# lives on, rather than assuming a GPU.
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
# max_length=50 bounds the length of the sequence returned by generate().
outputs = model.generate(**inputs, max_length=50)
# generate() returns a batch; decode its first (only) sequence without special tokens.
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("LLM Response:", response)

In [None]:
# Load model directly
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM

# NOTE: this rebinds the notebook-level `tokenizer` and `model`, so every
# generation cell executed after this one uses the GPT-2 checkpoint.
model_name = "openai-community/gpt2"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(model_name)
# Use the GPU when available, otherwise stay on the CPU instead of raising.
# Left as the last expression so the notebook still displays the model.
model.to("cuda" if torch.cuda.is_available() else "cpu")

In [None]:
# Prompt the currently loaded model and print the decoded continuation.
prompt = "What is the capital of Pakistan"
# Keep the input tensors on the same device as the model (GPU or CPU).
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
# max_length=50 bounds the length of the sequence returned by generate().
outputs = model.generate(**inputs, max_length=50)
# Decode the first (only) sequence of the returned batch, dropping special tokens.
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("LLM Response:", response)

In [None]:
# Load model directly
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM

# NOTE: this rebinds the notebook-level `tokenizer` and `model`, so every
# generation cell executed after this one uses the DistilGPT-2 checkpoint.
model_name = "distilbert/distilgpt2"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(model_name)
# Use the GPU when available, otherwise stay on the CPU instead of raising.
# Left as the last expression so the notebook still displays the model.
model.to("cuda" if torch.cuda.is_available() else "cpu")

In [None]:
# Prompt the currently loaded model and print the decoded continuation.
prompt = "Tell me about California"
# Keep the input tensors on the same device as the model (GPU or CPU).
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
# max_length=50 bounds the length of the sequence returned by generate().
outputs = model.generate(**inputs, max_length=50)
# Decode the first (only) sequence of the returned batch, dropping special tokens.
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("LLM Response:", response)

In [None]:
# Load model directly
import torch
from transformers import AutoTokenizer, AutoModelForCausalLM

# NOTE: this rebinds the notebook-level `tokenizer` and `model`, so every
# generation cell executed after this one uses the fairseq-dense checkpoint.
model_name = "KoboldAI/fairseq-dense-125M"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(model_name)
# Use the GPU when available, otherwise stay on the CPU instead of raising.
# Left as the last expression so the notebook still displays the model.
model.to("cuda" if torch.cuda.is_available() else "cpu")

In [None]:
# Prompt the currently loaded model and print the decoded continuation.
prompt ="What is the capital of France"
# Keep the input tensors on the same device as the model (GPU or CPU).
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
# max_length=50 bounds the length of the sequence returned by generate().
outputs = model.generate(**inputs, max_length=50)
# Decode the first (only) sequence of the returned batch, dropping special tokens.
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("LLM Response:", response)

In [None]:
# Prompt the currently loaded model and print the decoded continuation.
prompt = "What is the weather in Karachi today?"

# Keep the input tensors on the same device as the model (GPU or CPU).
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)
# max_length=50 bounds the length of the sequence returned by generate().
outputs = model.generate(**inputs, max_length=50)
# Decode the first (only) sequence of the returned batch, dropping special tokens.
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("LLM Response:", response)

In [None]:
import torch

# Instruction-style prompt, generated with sampling instead of the default decoding.
prompt = "Instruction: Explain gravity in one clear sentence.\nAnswer:"
# Keep the input tensors on the same device as the model (GPU or CPU).
inputs = tokenizer(prompt, return_tensors="pt").to(model.device)

# Sampling draws from torch's random number generator; fix the seed so that
# re-running this cell reproduces the same text.
torch.manual_seed(42)

outputs = model.generate(
    **inputs,
    max_length=50,
    do_sample=True,   # allows randomness
    top_k=50,         # restrict sampling to the 50 highest-probability tokens
    temperature=0.7,  # rescales the token distribution before sampling
)

# Decode the first (only) sequence of the returned batch, dropping special tokens.
response = tokenizer.decode(outputs[0], skip_special_tokens=True)
print("LLM Response:", response)

