# Transcribing Podcasts

### Step 1: Install Required Libraries


Install these packages if you haven't already:

In [None]:
pip install google-cloud-speech pydub


### Step 2: Convert MP3 to WAV (Google Cloud Speech prefers WAV format)

In [1]:
from pydub import AudioSegment

def convert_mp3_to_wav(mp3_file, wav_file, channels=1, sample_width=2):
    """Convert an MP3 file to a WAV file suitable for LINEAR16 recognition.

    Podcast MP3s are typically stereo, but Google Cloud Speech-to-Text
    rejects multi-channel WAV input unless the request explicitly declares
    the channel count, and its LINEAR16 encoding expects 16-bit samples.
    The audio is therefore normalised before export.

    Args:
        mp3_file: Path to (or file object of) the source MP3.
        wav_file: Path to (or file object for) the WAV output.
        channels: Number of output channels; defaults to 1 (mono).
            Pass ``None`` to keep the source channel layout.
        sample_width: Bytes per sample; defaults to 2 (16-bit PCM).
            Pass ``None`` to keep the source sample width.
    """
    audio = AudioSegment.from_mp3(mp3_file)

    # pydub's setters return a new segment rather than mutating in place.
    if channels is not None:
        audio = audio.set_channels(channels)
    if sample_width is not None:
        audio = audio.set_sample_width(sample_width)

    audio.export(wav_file, format="wav")


### Step 3: Transcribe with Google Cloud Speech-to-Text

In [None]:
from google.cloud import speech
import io

def transcribe_audio(wav_file, language_code="en-US", chunk_seconds=55):
    """Transcribe a 16-bit PCM WAV file with Google Cloud Speech-to-Text.

    Synchronous ``recognize`` requests with inline audio are limited to
    roughly one minute of audio and about 10 MB per request, which a
    podcast easily exceeds. The file is therefore read in consecutive
    chunks that stay under both limits, each chunk is recognised
    separately, and the partial transcripts are joined in order.

    Words that straddle a chunk boundary may be transcribed imperfectly.

    Args:
        wav_file: Path to an uncompressed 16-bit PCM WAV file.
        language_code: BCP-47 language tag of the speech.
        chunk_seconds: Maximum audio duration sent per request; keep it
            below the service's one-minute synchronous limit.

    Returns:
        The transcript as a single space-separated string (empty if the
        service recognised nothing).

    Raises:
        ValueError: If the WAV file does not contain 16-bit samples.
        wave.Error: If the file is not a WAV file the ``wave`` module
            can read.
    """
    # Local import so this block does not depend on edits to other cells.
    import wave

    # Safety margin below the service's ~10 MB inline-content limit.
    max_chunk_bytes = 9_000_000

    client = speech.SpeechClient()
    pieces = []

    with wave.open(wav_file, "rb") as wav:
        sample_width = wav.getsampwidth()
        if sample_width != 2:
            raise ValueError(
                f"LINEAR16 requires 16-bit samples, got {sample_width * 8}-bit audio"
            )

        sample_rate = wav.getframerate()
        channel_count = wav.getnchannels()
        bytes_per_frame = channel_count * sample_width

        # Respect both the duration limit and the payload-size limit.
        frames_per_chunk = max(
            1,
            min(
                int(sample_rate * chunk_seconds),
                max_chunk_bytes // bytes_per_frame,
            ),
        )

        # Raw PCM frames carry no header, so the sample rate and channel
        # count must be stated explicitly in the request config.
        config = speech.RecognitionConfig(
            encoding=speech.RecognitionConfig.AudioEncoding.LINEAR16,
            sample_rate_hertz=sample_rate,
            audio_channel_count=channel_count,
            language_code=language_code,
        )

        while True:
            frames = wav.readframes(frames_per_chunk)
            if not frames:
                break

            audio = speech.RecognitionAudio(content=frames)
            response = client.recognize(config=config, audio=audio)

            # Skip results that carry no alternatives instead of raising
            # IndexError on alternatives[0].
            pieces.extend(
                result.alternatives[0].transcript.strip()
                for result in response.results
                if result.alternatives
            )

    return " ".join(piece for piece in pieces if piece)

# Usage: convert the podcast to WAV, then transcribe the converted file.
convert_mp3_to_wav("your_audio.mp3", "temp_audio.wav")
transcript = transcribe_audio("temp_audio.wav")

# Save transcript. The encoding is set explicitly so that non-ASCII
# characters in the transcript do not fail under a platform default
# encoding that cannot represent them.
with open("transcript.txt", "w", encoding="utf-8") as file:
    file.write(transcript)
