In [13]:
pip install SpeechRecognition pydub pandas

Collecting pydub
  Downloading pydub-0.25.1-py2.py3-none-any.whl (32 kB)
Installing collected packages: pydub
Successfully installed pydub-0.25.1


In [None]:
import os
import re
import unicodedata

import pandas as pd
import speech_recognition as sr

def extract_text_from_audio(audio_path, language='hi-IN'):
    """Transcribe one audio file with ``Recognizer.recognize_google``.

    Args:
        audio_path: Path of the audio file handed to ``sr.AudioFile``.
        language: Language tag passed to ``recognize_google``. Defaults to
            ``'hi-IN'``, the value that was previously hard-coded.

    Returns:
        The transcription returned by ``recognize_google``, or ``None`` if
        anything fails (the error is printed, not raised).
    """
    try:
        recognizer = sr.Recognizer()
        with sr.AudioFile(audio_path) as source:
            audio_data = recognizer.record(source)

        # The audio is fully read at this point, so the file is closed before
        # the recognition request is made.
        return recognizer.recognize_google(audio_data, language=language)
    except Exception as e:
        # Best-effort by design: report which file failed and let the caller
        # carry on with the remaining files.
        print(f"Error in extracting text from {audio_path}: {e}")
        return None

def clean_text(text):
    """Lower-case ``text`` and replace each run of non-word characters with one space.

    A character is kept when it is alphanumeric, an underscore, or a Unicode
    combining mark (category ``M*``). The previous ``\\W+`` pattern treated
    combining marks as non-word characters, which removed Devanagari vowel
    signs and split Hindi words apart.

    Args:
        text: The string to clean. ``None`` or an empty string is accepted.

    Returns:
        The cleaned string; ``''`` when ``text`` is ``None`` or empty.
        Leading and trailing separators collapse to a single space and are
        not stripped, as before.
    """
    if not text:
        return ''

    def _is_word_char(ch):
        # str.isalnum() or '_' is what the regex class \w matches;
        # the category check additionally keeps combining marks.
        return ch == '_' or ch.isalnum() or unicodedata.category(ch).startswith('M')

    spaced = ''.join(ch if _is_word_char(ch) else ' ' for ch in text.lower())
    return re.sub(r' +', ' ', spaced)

def load_data(folder_path):
    """Transcribe every ``.wav`` file in a local folder into a DataFrame.

    Args:
        folder_path: Local directory to scan with ``os.listdir``.

    Returns:
        A ``pandas.DataFrame`` with columns ``file_name`` and
        ``transcribed_text``, one row per ``.wav`` file in file-name order.
        ``transcribed_text`` is ``None`` for files whose transcription failed.
        The columns are present even when no file matched.
    """
    records = []
    # os.listdir returns entries in arbitrary order; sorting keeps the output
    # reproducible between runs.
    for filename in sorted(os.listdir(folder_path)):
        # Case-insensitive so that e.g. "CLIP.WAV" is picked up as well.
        if not filename.lower().endswith('.wav'):
            continue

        file_path = os.path.join(folder_path, filename)
        transcribed_text = extract_text_from_audio(file_path)
        # A failed transcription comes back as None. Keep the row so the
        # failure stays visible, but do not hand None to clean_text.
        cleaned_text = clean_text(transcribed_text) if transcribed_text is not None else None
        records.append({'file_name': filename, 'transcribed_text': cleaned_text})

    return pd.DataFrame(records, columns=['file_name', 'transcribed_text'])

def save_data(df, file_path):
    """Write ``df`` to ``file_path`` as CSV, leaving out the index column."""
    df.to_csv(path_or_buf=file_path, index=False)
    return None

# Remote location the notebook originally pointed at. Kept for provenance only:
# load_data() lists a directory with os.listdir(), which cannot read an HTTP URL,
# so the .wav files have to be available locally in `folder_path`.
corpus_url = "https://repository.voxforge1.org/downloads/SpeechCorpus/Trunk/Audio/Original/44.1kHz_16bit/"
# NOTE(review): local directory name is a placeholder — point it at wherever
# the .wav files actually live.
folder_path = "audio_data"
output_file_path = "cleaned_audio_data.csv"

# Fail early with an actionable message instead of an opaque os.listdir error.
if not os.path.isdir(folder_path):
    raise FileNotFoundError(
        f"Audio folder '{folder_path}' not found. Place the .wav files from "
        f"{corpus_url} in that directory (or update folder_path) and re-run."
    )

df = load_data(folder_path)
save_data(df, output_file_path)

print(f"Cleaned data saved to {output_file_path}")