# 📝 Meeting Summarizer - Colab Version

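Transcribe meeting audio with Whisper, then summarize the transcript with a Hugging Face sequence-to-sequence Transformer model (Pegasus by default). Other seq2seq summarization checkpoints can be swapped in by changing `model_id`; decoder-only models such as Mistral would need a different loader than the `AutoModelForSeq2SeqLM` used below.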

In [None]:
# 🔧 Install dependencies
# Runs pip through IPython's `!` shell escape, so this line only works inside a
# notebook (Colab/Jupyter), not as plain Python.
# The cells below import `whisper` (from the openai-whisper package) and
# `transformers` directly.
# NOTE(review): `accelerate` and `peft` are not imported by any cell visible in
# this notebook; `torch` and `sentencepiece` are presumably runtime
# requirements of the libraries above — confirm before trimming the list.
!pip install transformers accelerate peft openai-whisper torch sentencepiece

## 📤 Upload your audio file

In [None]:
from google.colab import files

# Open Colab's upload widget. The returned mapping is keyed by the name of
# each uploaded file.
uploaded = files.upload()

# Fail with a readable message instead of a bare IndexError when the dialog
# is cancelled or no file is selected.
if not uploaded:
    raise ValueError(
        "No file was uploaded. Re-run this cell and choose an audio file."
    )

# Only the first uploaded file is used; any additional files are ignored.
audio_path = next(iter(uploaded))

## 🎧 Transcribe audio with Whisper

In [None]:
import whisper
# Load the "base" Whisper checkpoint.
# NOTE(review): the name `model` is rebound to the summarization model by the
# summarization cell further down, so after that cell has run `model` no
# longer refers to Whisper until this cell is executed again.
model = whisper.load_model("base")
# Transcribe the uploaded file; `audio_path` is set by the upload cell.
result = model.transcribe(audio_path)
# Keep only the text field of the result; the summarization cell reads
# `transcript`.
transcript = result["text"]
# Print the raw transcript so it can be checked before summarizing.
print(transcript)

## ✂️ Summarize the Transcript

In [None]:
import textwrap

from transformers import pipeline, AutoTokenizer, AutoModelForSeq2SeqLM

# Checkpoint used for summarization. It is loaded with AutoModelForSeq2SeqLM,
# so a replacement must be a sequence-to-sequence model.
model_id = "google/pegasus-xsum"  # You can change this
tokenizer = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForSeq2SeqLM.from_pretrained(model_id)

summarizer = pipeline("summarization", model=model, tokenizer=tokenizer)

# Split the transcript into pieces of at most 1024 characters, breaking on
# whitespace so words are not cut in half at chunk boundaries. A single
# "word" longer than 1024 characters is still hard-split so the size limit
# always holds. An empty or whitespace-only transcript yields no chunks.
chunks = textwrap.wrap(
    transcript,
    width=1024,
    break_long_words=True,
    break_on_hyphens=False,
)

# Summarize each chunk independently and collect the partial summaries.
summary_parts = []
for chunk in chunks:
    out = summarizer(
        chunk,
        max_length=100,
        min_length=30,
        do_sample=False,
        # Guard against a token-dense chunk exceeding the model's maximum
        # input length; such input is truncated instead of raising.
        truncation=True,
    )
    summary_parts.append(out[0]["summary_text"].strip())

# Join once at the end: avoids repeated string concatenation and the
# trailing space the incremental version left behind.
summary = " ".join(summary_parts)

print("\n✅ Summary:\n")
print(summary)