In [5]:
import os

from google.cloud.speech_v2 import SpeechClient
from google.cloud.speech_v2.types import cloud_speech


def quickstart_v2(
    project_id: str,
    audio_file: str,
    language_codes: tuple = ("en-US",),
    model: str = "latest_long",
) -> cloud_speech.RecognizeResponse:
    """Transcribe a local audio file with the Speech-to-Text v2 API.

    The file is read fully into memory and sent in a single synchronous
    ``recognize`` request against the project's default recognizer
    (``recognizers/_`` in the ``global`` location). The top alternative of
    each result is printed as it is iterated.

    NOTE(review): synchronous recognition is meant for short clips; confirm
    the current duration/size limits in the API docs before using this on
    long recordings.

    Args:
        project_id: Google Cloud project ID used to build the recognizer path.
        audio_file: Path to the audio file to transcribe.
        language_codes: Language codes passed to the recognition config.
            Defaults to US English.
        model: Name of the recognition model. Defaults to ``"latest_long"``.

    Returns:
        The full ``RecognizeResponse`` returned by the service.

    Raises:
        OSError: If ``audio_file`` cannot be opened or read.
    """
    # Instantiates a client
    client = SpeechClient()

    # Reads the file as raw bytes; the encoding is detected server-side.
    with open(audio_file, "rb") as f:
        content = f.read()

    config = cloud_speech.RecognitionConfig(
        auto_decoding_config=cloud_speech.AutoDetectDecodingConfig(),
        language_codes=list(language_codes),
        model=model,
    )

    request = cloud_speech.RecognizeRequest(
        recognizer=f"projects/{project_id}/locations/global/recognizers/_",
        config=config,
        content=content,
    )

    # Transcribes the audio into text
    response = client.recognize(request=request)

    for result in response.results:
        # A result may carry no alternatives; indexing [0] on it would raise
        # IndexError, so such results are skipped.
        if not result.alternatives:
            continue
        print(f"Transcript: {result.alternatives[0].transcript}")

    return response


# Project used to build the recognizer path. Honour GOOGLE_CLOUD_PROJECT when
# it is set so the notebook runs unchanged in other environments; otherwise
# fall back to the original project ID.
my_project_id = os.environ.get("GOOGLE_CLOUD_PROJECT") or "adroit-metric-384510"

In [6]:
# Recording to transcribe; a relative path is resolved against the kernel's
# current working directory.
my_audio_file = "myAudio.mp3"

# Run the recognition request and keep the full response for later cells.
responseFromGoogle = quickstart_v2(
    project_id=my_project_id,
    audio_file=my_audio_file,
)

Transcript: so far
Transcript:  as the ultimate goal is concerned
Transcript:  I think none of us
Transcript:  need have any apprehensions none of us need have any doubt
Transcript:  but my fear which I must Express clearly
Transcript:  is this
Transcript:  our difficulty as I said is not about the ultimate future
Transcript:  our difficulty is


In [7]:
# Show the raw response so the per-result confidence, end offset and language
# code can be inspected alongside each transcript.
responseFromGoogle

results {
  alternatives {
    transcript: "so far"
    confidence: 0.971142173
  }
  result_end_offset {
    seconds: 2
    nanos: 110000000
  }
  language_code: "en-US"
}
results {
  alternatives {
    transcript: " as the ultimate goal is concerned"
    confidence: 0.966914356
  }
  result_end_offset {
    seconds: 4
    nanos: 840000000
  }
  language_code: "en-US"
}
results {
  alternatives {
    transcript: " I think none of us"
    confidence: 0.966946781
  }
  result_end_offset {
    seconds: 7
    nanos: 50000000
  }
  language_code: "en-US"
}
results {
  alternatives {
    transcript: " need have any apprehensions none of us need have any doubt"
    confidence: 0.956716359
  }
  result_end_offset {
    seconds: 12
    nanos: 660000000
  }
  language_code: "en-US"
}
results {
  alternatives {
    transcript: " but my fear which I must Express clearly"
    confidence: 0.969098568
  }
  result_end_offset {
    seconds: 16
    nanos: 870000000
  }
  language_code: "en-US"
}
resul

In [8]:
# Stitch the top alternative of every result into a single transcript.
# No separator is inserted: in the responses seen so far each segment after
# the first already begins with a space.
# Results without alternatives are filtered out, since indexing [0] on them
# would raise IndexError.
audioTranscript = ''.join(
    result.alternatives[0].transcript
    for result in responseFromGoogle.results
    if result.alternatives
)
print(audioTranscript)

so far as the ultimate goal is concerned I think none of us need have any apprehensions none of us need have any doubt but my fear which I must Express clearly is this our difficulty as I said is not about the ultimate future our difficulty is
