# Audio to Text using Hugging Face Transformers
This notebook demonstrates how to transcribe speech from an audio file to text with the Hugging Face `transformers` library and the OpenAI Whisper model.

In [None]:
# Install necessary libraries if not present.
# `%pip` (rather than `!pip`) installs into the environment of the running kernel.
# NOTE(review): versions are unpinned, so a fresh install may pull releases that
# behave differently from the ones this notebook was written against — consider
# pinning once a known-good set is confirmed.
# NOTE(review): transcribing from a file path (as done later in this notebook)
# presumably also needs a system `ffmpeg` binary, which pip does not install —
# confirm against the transformers ASR pipeline documentation.
%pip install transformers torch torchaudio librosa

In [None]:
from pathlib import Path

import torch
from transformers import pipeline

# Pick the compute device: use CUDA when torch reports it as available,
# otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"
print(f"Using device: {device}")

In [None]:
# Initialize the ASR pipeline.
# 'openai/whisper-small' is used for a good balance of speed and accuracy.
# Whisper processes audio in windows of up to 30 seconds; chunk_length_s=30
# turns on the pipeline's chunking so that longer recordings are transcribed
# in full rather than only fitting a single window.
transcriber = pipeline(
    "automatic-speech-recognition",
    model="openai/whisper-small",
    chunk_length_s=30,
    device=device,
)
print("Model loaded successfully!")

In [None]:
# Example: Transcribe a sample audio file

def transcribe_audio(file_path, asr_pipeline=None):
    """Transcribe one audio input and return the recognized text.

    Args:
        file_path: Audio input passed unchanged to the recognizer (in this
            notebook, a path string to an audio file).
        asr_pipeline: Optional callable to use instead of the notebook-level
            `transcriber`. It is called as `asr_pipeline(file_path)` and must
            return a mapping with a "text" entry. When None (the default),
            the global `transcriber` is used, exactly as before.

    Returns:
        The value stored under "text" in the recognizer's result. This
        function never raises: on any failure it returns a string of the
        form "Error: <message>", so callers that need to tell success from
        failure must check for that prefix.
    """
    try:
        # Resolve the recognizer inside the try block so that a missing global
        # `transcriber` (model cell not run yet) is reported like any other error.
        recognizer = transcriber if asr_pipeline is None else asr_pipeline
        # The pipeline handles loading and resampling automatically
        result = recognizer(file_path)
        return result["text"]
    except Exception as e:
        # Deliberate best-effort: surface the failure as text instead of a traceback.
        return f"Error: {e}"

# User file to transcribe.
# The location is built from the current user's home directory instead of a
# hard-coded absolute path, so the notebook is not tied to one account.
# Edit AUDIO_DIR / AUDIO_NAME to point at your own recording.
AUDIO_DIR = Path.home() / "Downloads"
AUDIO_NAME = "WhatsApp Audio 2026-01-06 at 5.19.54 PM.mp4"
# Converted to a plain string before being handed to transcribe_audio.
AUDIO_FILENAME = str(AUDIO_DIR / AUDIO_NAME)

print(f"Processing {AUDIO_FILENAME}...")
# transcribe_audio returns an "Error: ..." string instead of raising, so a
# failure shows up as the printed text below.
text = transcribe_audio(AUDIO_FILENAME)
print("\n--- Transcription ---\n")
print(text)