# Task 2: Speech-to-Text System
This notebook demonstrates how to convert speech from an audio file into text using the SpeechRecognition library and the Google Web Speech API. The pydub library is used only for the optional MP3-to-WAV conversion step.

In [1]:
!pip install SpeechRecognition pydub



In [3]:
import speech_recognition as sr
from pydub import AudioSegment



### Optional: Convert MP3 to WAV

In [5]:
def convert_mp3_to_wav(mp3_path, wav_path):
    """Re-encode the MP3 file at ``mp3_path`` as a WAV file at ``wav_path``.

    Args:
        mp3_path: Location of the MP3 file to read.
        wav_path: Destination the WAV data is exported to.

    Prints a one-line confirmation after the export call returns.
    """
    # Load and export in a single chain; the intermediate segment is not
    # needed afterwards, so it is never bound to a name.
    AudioSegment.from_mp3(mp3_path).export(wav_path, format="wav")
    print(f"Converted {mp3_path} to {wav_path}")

# Example:
# convert_mp3_to_wav("sample.mp3", "sample.wav")

### Transcribe Audio

In [7]:
def transcribe_audio(file_path):
    """Transcribe an audio file and print the recognized text.

    The whole file is read through ``sr.AudioFile`` / ``Recognizer.record``
    and passed to ``Recognizer.recognize_google``. The failures handled below
    are reported as printed messages rather than raised; the function returns
    nothing.

    Args:
        file_path: Path to the audio file to transcribe.
    """
    recognizer = sr.Recognizer()
    try:
        with sr.AudioFile(file_path) as source:
            print("Listening to audio...")
            audio = recognizer.record(source)
        print("Transcribing...")
        text = recognizer.recognize_google(audio)
        print("\n🎧 Transcription Result:\n")
        print(text)
    except FileNotFoundError:
        print("❌ File not found. Please check the path and try again.")
    except sr.UnknownValueError:
        print("😕 Could not understand the audio.")
    except sr.RequestError as e:
        print(f"🚫 Could not request results from Google Speech Recognition service; {e}")
    except ValueError as e:
        # sr.AudioFile raises ValueError for files it cannot parse as
        # WAV/AIFF/FLAC (for example an MP3 that was not converted first).
        # Kept after the sr.* handlers so the more specific ones always win.
        print(
            "❌ Could not read the audio file. Supported formats are PCM WAV, AIFF, "
            f"and FLAC; convert MP3 files with convert_mp3_to_wav first. ({e})"
        )

In [9]:
# Run this cell to start transcription.
# Surrounding whitespace is stripped so that a pasted path with a stray leading
# space or trailing newline still resolves to the intended file.
file_path = input("Enter path to your audio file (e.g., sample.wav): ").strip()
transcribe_audio(file_path)

Enter path to your audio file (e.g., sample.wav):  /Users/sowmyapujari31/Downloads/file_example_WAV_1MG.wav


Listening to audio...
Transcribing...
😕 Could not understand the audio.
