# Test Whisper on Single File

Verify Whisper works with one audio file before batch processing.

In [None]:
import whisper
from src.voice_eval.config import load_config

In [None]:
# Pull the Whisper settings and the input location from the project config.
model_name = load_config("whisper", "model")
language = load_config("whisper", "language")
audio_dir = load_config("input", "audio_dir")

# Echo the resolved settings so a misconfiguration is visible before the
# model is loaded.
print(
    f"Loading Whisper model: {model_name}",
    f"Language: {language}",
    f"Audio directory: {audio_dir}",
    sep="\n",
)

In [None]:
# Load the Whisper model selected by the `model_name` config value.
model = whisper.load_model(model_name)
# Plain string literal: the message has no placeholders, so no f-prefix.
print("✓ Model loaded successfully")

In [None]:
from pathlib import Path

# Hard-coded sample recording used for this single-file check; it is expected
# to live directly under `audio_dir`.
test_file = f"{audio_dir}/+917259326110_Fakkirswami S V.aac"

# Fail fast with a clear message. Without this check, a missing or misnamed
# file is only detected later, inside model.transcribe(), as an audio-loading
# failure that is harder to diagnose.
if not Path(test_file).is_file():
    raise FileNotFoundError(f"Test audio file not found: {test_file}")

print(f"Transcribing: {test_file}\n")

In [None]:
# Transcribe the sample file in the configured language; verbose=True is
# passed through to Whisper unchanged.
result = model.transcribe(test_file, language=language, verbose=True)

In [None]:
# Banner: blank line, rule, title, rule.
print("", "=" * 60, "FULL TRANSCRIPTION:", "=" * 60, sep="\n")
# The complete transcript text returned by the transcribe call.
print(result["text"])

In [None]:
# Banner: blank line, rule, title, rule.
print("", "=" * 60, "TIMESTAMPED SEGMENTS (first 5):", "=" * 60, sep="\n")

# Show only the first five segments: the time range on one line, then the
# segment text indented beneath it.
for segment in result["segments"][:5]:
    print(
        f"[{segment['start']:.1f}s -> {segment['end']:.1f}s]",
        f"  {segment['text']}",
        sep="\n",
    )

# Report the full count so it is clear how much was left out of the preview.
print(f"\nTotal segments: {len(result['segments'])}")