<a href="https://colab.research.google.com/github/TSGUSA/Transcription-whisper/blob/main/transcription.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
# Install dependencies
!pip install -q openai-whisper ffmpeg-python

# Import required libraries
import whisper
import torch
import gc
from google.colab import files

# Free memory left over from earlier runs of this cell.
# Run the garbage collector first so that memory held by unreachable objects
# is handed back before the CUDA cache is emptied; emptying the cache first
# would leave that memory cached.
gc.collect()
torch.cuda.empty_cache()

# Greet the user and explain what this notebook does.
print("🌟 Welcome to the Whisper Transcription Tool! 🌟")
print("This tool will transcribe your audio file into text using OpenAI's Whisper model.")
print("Please upload an audio file (MP3, WAV, M4A, etc.) when prompted.\n")

# Step 1: ask the user for an audio file through Colab's upload widget.
print("📂 Step 1: Upload your audio file")
uploaded = files.upload()

# The result is keyed by file name and may be empty (e.g. if the upload is
# cancelled); stop with a clear message instead of failing on the lookup below.
if not uploaded:
    raise RuntimeError("No file was uploaded. Re-run this cell and choose an audio file.")

# Only the first uploaded file is transcribed; any additional files are ignored.
audio_file = next(iter(uploaded))
print(f"✅ File '{audio_file}' uploaded successfully!\n")

# Step 2: load the Whisper checkpoint used for transcription.
# MODEL_NAME selects the checkpoint: a smaller one such as "base" gives
# faster results, while "medium" or "large" give better accuracy.
MODEL_NAME = "large-v3-turbo"

print("🤖 Step 2: Loading the Whisper model...")
model = whisper.load_model(MODEL_NAME)
print("✅ Model loaded successfully!\n")

# Step 3: run speech-to-text on the uploaded file.
for status_line in (
    "🎙️ Step 3: Transcribing your audio file...",
    "This may take a while depending on the size of the file and the model you selected.",
    "Please wait...\n",
):
    print(status_line)

# verbose=True is requested so progress is reported while the model works.
result = model.transcribe(audio_file, verbose=True)

# Show the complete transcript once transcription has finished.
print("\n🎉 Transcription Complete! Here's the result:\n")
transcript_text = result["text"]
print(transcript_text)

# Persist the transcript next to the upload; the output name is the uploaded
# file's full name (extension included) followed by "_transcription.txt".
output_file = f"{audio_file}_transcription.txt"
with open(output_file, mode="w", encoding="utf-8") as transcript_fh:
    transcript_fh.write(result["text"])

print(f"\n💾 Transcription saved to '{output_file}' in your Colab workspace.")

# Hand the saved file to Colab's download helper so the user gets a copy.
files.download(output_file)
print(f"📥 File '{output_file}' has been downloaded automatically.")