## Import OpenAI client

In [1]:
from client import client

## Download sample data for transcription

In [2]:
from pathlib import Path
import requests

# Local path where the sample earnings-call recording is cached between runs.
audio_file_path = Path("data/EarningsCall.wav")

if not audio_file_path.exists():
    # Download the audio file from link
    download_link = "https://cdn.openai.com/API/examples/data/EarningsCall.wav"
    audio_file_path.parent.mkdir(parents=True, exist_ok=True)
    print("Downloading audio file from link... ", end="")
    # Fetch and validate the response *before* creating the file. Opening the
    # file first would leave an empty file behind if the request fails, and the
    # exists() guard above would then skip the download on every later run.
    response = requests.get(download_link, timeout=60)
    response.raise_for_status()  # do not save an HTTP error page as a .wav
    audio_file_path.write_bytes(response.content)
    print("Done.")

## Transcribe the audio file

In [6]:
# Send the recording to the transcription endpoint. The context manager closes
# the file handle as soon as the request finishes instead of leaving it open
# for the lifetime of the kernel.
with open(audio_file_path, "rb") as audio_file:
    transcription = client.audio.transcriptions.create(
        model="whisper-1",
        file=audio_file,
    )

print(transcription.text)

Good afternoon, everyone, and welcome to FinTech Plus Sync's second quarter 2023 earnings call. I'm John Doe, CEO of FinTech Plus. We've had a stellar Q2 with a revenue of $125 million, a 25% increase year over year. Our gross profit margin stands at a solid 58%, due in part to cost efficiencies gained from our scalable business model. Our EBITDA has surged to $37.5 million, translating to a remarkable 30% EBITDA margin. Our net income for the quarter rose to $16 million, which is a noteworthy increase from $10 million in Q2 2022. Our total addressable market has grown substantially, thanks to the expansion of our high-yield savings product line and the new RoboAdvisor platform. We've been diversifying our asset-backed securities portfolio, investing heavily in collateralized debt obligations and residential mortgage-backed securities. We've also invested $25 million in AAA-rated corporate bonds, enhancing our risk-adjusted returns. As for our balance sheet, total assets reached $1.5 b

## Transcribe and translate the hobbit file

In [3]:
# This recording must already be present locally; fail early with a message
# that names the missing path rather than a bare AssertionError.
hobbit_audio_file = Path("data/the hobbit.m4a")
assert hobbit_audio_file.exists(), f"Missing audio file: {hobbit_audio_file}"

In [4]:
# Trial 1 - no information about the language, transcription only
# (the context manager closes the audio file once the request completes)
with open(hobbit_audio_file, "rb") as hobbit_audio:
    hobbit_trial_1 = client.audio.transcriptions.create(
        model="whisper-1",
        file=hobbit_audio,
    )

In [5]:
# The result is a transcription in the original spoken language (Hebrew, per
# the output below) - the transcriptions endpoint did not translate it to English
hobbit_trial_1

Transcription(text="ההוביט, או לשם ובחזרה, הוא ספר פנטזיה מאת ג'ון רונאלד ראואל טולקין. הספר עוסק במסעו של ההוביט, בילבו בגינס, יחד עם חבורת גמדים, במטרה לשחרר את ממלכתם העבודה מאכיזתו של דרקון בשם סמוג. הספר מיועד בעיקר לילדים, למרות שהוא מכיל קטעים מפחידים שעלולים לתרוף את שנתם, אך נקרא על ידי בני כל הגילאים. בדומה לספר ההרפתקאות, אליס בארץ הפלאות, ספר זה נולד מסיפורים בהמשכים שנהג הסופר טולקין לספר לילדיו. טולקין היה פרופסור לבלשנות, לשון וספרות, וקיים את הטענה שהוא כתב את הספר כדי להדגים לסטודנטים כיצד ניתן ליצור הפעירה בעזרת מילים.")

In [6]:
# Trial 2 - use translations instead of transcriptions
# (the context manager closes the audio file once the request completes)
with open(hobbit_audio_file, "rb") as hobbit_audio:
    hobbit_trial_2 = client.audio.translations.create(
        model="whisper-1",
        file=hobbit_audio,
    )

In [7]:
# The result is an English translation of the original speech
hobbit_trial_2

Translation(text='The Hobbit is a fantasy book by John Ronald Reuel Tolkien. The book deals with the story of the Hobbit, Bilbo Baggins, together with a group of dwarves, in an attempt to free their kingdom from the grip of a dragon named Smaug. The book is mainly intended for children, even though it contains frightening details that may change over the years, but it is read by children of all ages. Similar to the book The Adventures of Alice in Wonderland, this book is born from stories that Tolkien used to tell his children. Tolkien was a linguist and a professor of literature, and there is a claim that he wrote the book to demonstrate to students how it can be created using words.')