In [1]:
!pip install transformers gradio

Collecting gradio
  Downloading gradio-5.9.1-py3-none-any.whl.metadata (16 kB)
Collecting aiofiles<24.0,>=22.0 (from gradio)
  Downloading aiofiles-23.2.1-py3-none-any.whl.metadata (9.7 kB)
Collecting fastapi<1.0,>=0.115.2 (from gradio)
  Downloading fastapi-0.115.6-py3-none-any.whl.metadata (27 kB)
Collecting ffmpy (from gradio)
  Downloading ffmpy-0.5.0-py3-none-any.whl.metadata (3.0 kB)
Collecting gradio-client==1.5.2 (from gradio)
  Downloading gradio_client-1.5.2-py3-none-any.whl.metadata (7.1 kB)
Collecting markupsafe~=2.0 (from gradio)
  Downloading MarkupSafe-2.1.5-cp310-cp310-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metadata (3.0 kB)
Collecting pydub (from gradio)
  Downloading pydub-0.25.1-py2.py3-none-any.whl.metadata (1.4 kB)
Collecting python-multipart>=0.0.18 (from gradio)
  Downloading python_multipart-0.0.20-py3-none-any.whl.metadata (1.8 kB)
Collecting ruff>=0.2.2 (from gradio)
  Downloading ruff-0.8.6-py3-none-manylinux_2_17_x86_64.manylinux2014_x86_64.whl.metad

In [2]:
import gradio as gr
import pandas as pd
from transformers import T5Tokenizer, T5ForConditionalGeneration, MBartForConditionalGeneration, AutoTokenizer

# Load the models and tokenizers
vit5_model_path = "/content/drive/MyDrive/NLP/finetuned/vit5-finetuned"
mbart_model_path = "/content/drive/MyDrive/NLP/finetuned/vit5-finetuned"

# Load models and tokenizers
vit5_tokenizer = T5Tokenizer.from_pretrained(vit5_model_path)
vit5_model = T5ForConditionalGeneration.from_pretrained(vit5_model_path)

mbart_tokenizer = AutoTokenizer.from_pretrained(mbart_model_path)
mbart_model = MBartForConditionalGeneration.from_pretrained(mbart_model_path)

# Function to generate summary
def generate_summary(input_text, model_name):
    if model_name == "vit5":
        tokenizer, model = vit5_tokenizer, vit5_model
    elif model_name == "mbart":
        tokenizer, model = mbart_tokenizer, mbart_model
    else:
        return "Invalid model selected."

    input_ids = tokenizer("summarize: " + input_text, return_tensors="pt", max_length=512, truncation=True).input_ids
    output_ids = model.generate(input_ids, max_length=128, num_beams=4, early_stopping=True)
    summary = tokenizer.decode(output_ids[0], skip_special_tokens=True)
    return summary

# Gradio interface
iface = gr.Interface(
    fn=generate_summary,
    inputs=[
        gr.Textbox(lines=10, placeholder="Enter article text here...", label="Input Text"),
        gr.Radio(choices=["vit5", "mbart"], label="Select Model", value="vit5")
    ],
    outputs=gr.Textbox(label="Summary"),
    title="Text Summarization",
    description="Enter an article and select a model to get a concise summary.",
    flagging_mode="never"
)

iface.launch()


You set `add_prefix_space`. The tokenizer needs to be converted from the slow tokenizers
You are using a model of type t5 to instantiate a model of type mbart. This is not supported for all configurations of models and can yield errors.
Some weights of MBartForConditionalGeneration were not initialized from the model checkpoint at /content/drive/MyDrive/NLP/finetuned/vit5-finetuned and are newly initialized: ['decoder.embed_positions.weight', 'decoder.layer_norm.bias', 'decoder.layer_norm.weight', 'decoder.layernorm_embedding.bias', 'decoder.layernorm_embedding.weight', 'decoder.layers.0.encoder_attn.k_proj.bias', 'decoder.layers.0.encoder_attn.k_proj.weight', 'decoder.layers.0.encoder_attn.out_proj.bias', 'decoder.layers.0.encoder_attn.out_proj.weight', 'decoder.layers.0.encoder_attn.q_proj.bias', 'decoder.layers.0.encoder_attn.q_proj.weight', 'decoder.layers.0.encoder_attn.v_proj.bias', 'decoder.layers.0.encoder_attn.v_proj.weight', 'decoder.layers.0.encoder_attn_layer_norm.bias', 'd

Running Gradio in a Colab notebook requires sharing enabled. Automatically setting `share=True` (you can turn this off by setting `share=False` in `launch()` explicitly).

Colab notebook detected. To show errors in colab notebook, set debug=True in launch()
* Running on public URL: https://beda072a5c6e731eed.gradio.live

This share link expires in 72 hours. For free permanent hosting and GPU upgrades, run `gradio deploy` from the terminal in the working directory to deploy to Hugging Face Spaces (https://huggingface.co/spaces)


