# 🎤 Voice Recognition & Speech-to-Text Converter
Built in Google Colab using Python

This project takes an audio file (e.g., `.wav`, `.mp3`) and converts the spoken words into text.

In [None]:
# ✅ Install necessary libraries
!pip install SpeechRecognition pydub

In [None]:
# ✅ Upload your audio file (WAV or MP3)
# Calls Colab's upload helper and keeps the result in `uploaded`.
# The speech-to-text cell takes the first item yielded by iterating
# `uploaded` and uses it as the audio file name.
from google.colab import files
uploaded = files.upload()

In [None]:
# ✅ Convert speech to text
import os

import speech_recognition as sr
from pydub import AudioSegment

# `uploaded` is produced by the upload cell; iterating it yields file names.
# Fail with a clear message instead of a bare StopIteration when it is empty.
if not uploaded:
    raise RuntimeError("No audio file was uploaded - run the upload cell first.")
audio_file = next(iter(uploaded))

# MP3 uploads are converted to WAV before being handed to sr.AudioFile.
# Splitting off the extension (and comparing it case-insensitively) handles
# names such as "CLIP.MP3" and avoids rewriting ".mp3" elsewhere in the name.
stem, extension = os.path.splitext(audio_file)
if extension.lower() == '.mp3':
    sound = AudioSegment.from_mp3(audio_file)
    wav_file = stem + '.wav'
    sound.export(wav_file, format="wav")
else:
    wav_file = audio_file

recognizer = sr.Recognizer()
# The file only needs to stay open while the audio is read into memory.
with sr.AudioFile(wav_file) as source:
    audio_data = recognizer.record(source)

# Keep the try body to the single call that can raise the handled errors.
try:
    text = recognizer.recognize_google(audio_data)
except sr.UnknownValueError:
    print("❗ Could not understand audio.")
except sr.RequestError as error:
    # Include the underlying reason so the failure can be diagnosed.
    print("❗ Google API unavailable.", error)
else:
    print("📝 Transcribed Text:\n", text)

In [None]:
# ✅ (Optional) Text-to-Speech conversion
# Requires the gTTS package (`pip install gTTS`).
from gtts import gTTS
from IPython.display import Audio

# Read back the transcription stored in `text` by the speech-to-text cell.
# If that cell has not produced a usable string (not run, or recognition
# failed), fall back to the sample sentence so this cell still works alone.
spoken_text = globals().get("text")
if not (isinstance(spoken_text, str) and spoken_text.strip()):
    spoken_text = "This is the transcribed text being read aloud."

tts = gTTS(spoken_text)
tts.save("output.mp3")
# Must stay the last expression so the notebook renders the audio player.
Audio("output.mp3")