In [1]:
# ==============================
# STEP 1: Install Resemble SDK
# ==============================
!pip install resemble
!pip install SpeechRecognition pydub

Collecting resemble
  Downloading resemble-1.7.0-py3-none-any.whl.metadata (4.1 kB)
Downloading resemble-1.7.0-py3-none-any.whl (9.1 kB)
Installing collected packages: resemble
Successfully installed resemble-1.7.0


In [2]:
# ==============================
# STEP 2: Authenticate with API
# ==============================
import os
from getpass import getpass

from resemble import Resemble

# 🔑 Never store the API key in the notebook itself: take it from the
# RESEMBLE_API_KEY environment variable, or ask for it with a hidden prompt.
# NOTE(review): any key that was ever committed in this cell should be treated
# as leaked and rotated in the Resemble dashboard.
resemble_api_key = (os.environ.get("RESEMBLE_API_KEY") or getpass("🔑 Resemble API key: ")).strip()
if not resemble_api_key:
    raise ValueError("No Resemble API key provided; set RESEMBLE_API_KEY or enter it at the prompt.")

Resemble.api_key(resemble_api_key)

# NOTE(review): this presumably only stores the key locally; the first real
# API call in the next step is what actually proves it is valid — confirm.
print("✅ Resemble API authenticated successfully!")


✅ Resemble API authenticated successfully!


In [3]:
# ==============================
# STEP 3: Get Project and Voice
# ==============================
# Both lookups take the first entry of the listing returned for (1, 10)
# — presumably (page, page_size); verify against the SDK.
# An empty or missing 'items' list (no projects/voices on the account, or an
# error payload such as a rejected API key) is reported explicitly instead of
# surfacing as a bare IndexError/KeyError.

# Get default project
projects_page = Resemble.v2.projects.all(1, 10)
project_items = projects_page.get('items') or []
if not project_items:
    raise LookupError(f"No Resemble project available; API response: {projects_page}")
project_uuid = project_items[0]['uuid']
print("📂 Project UUID:", project_uuid)

# Get default voice
voices_page = Resemble.v2.voices.all(1, 10)
voice_items = voices_page.get('items') or []
if not voice_items:
    raise LookupError(f"No Resemble voice available; API response: {voices_page}")
voice_uuid = voice_items[0]['uuid']
print("🎙️ Voice UUID:", voice_uuid)


📂 Project UUID: 1e6a79ce
🎙️ Voice UUID: 28f1626c


In [4]:
# ==============================
# STEP 4: Upload an Audio File
# ==============================
from google.colab import files

# NOTE(review): the prompt below mentions MP3, but the transcription step
# opens the file with speech_recognition.AudioFile, which reads WAV/AIFF/FLAC;
# confirm which formats are actually meant to be supported.
print("📤 Upload your audio file (e.g., speech.wav, speech.mp3)")
uploaded = files.upload()

# Nothing to work with if the dialog was cancelled or no file was chosen.
if not uploaded:
    raise ValueError("No file was uploaded; re-run this cell and choose an audio file.")

# Get uploaded file name (the first one, if several were selected)
input_audio = next(iter(uploaded))
print("✅ Uploaded:", input_audio)


📤 Upload your audio file (e.g., speech.wav, speech.mp3)


Saving clip-Bilal's Rapid Voice Clone 1-2025_08_31.wav to clip-Bilal's Rapid Voice Clone 1-2025_08_31.wav
✅ Uploaded: clip-Bilal's Rapid Voice Clone 1-2025_08_31.wav


In [6]:
# ==============================
# STEP 5: Transcribe Uploaded Audio
# (Convert input audio → text)
# ==============================
import speech_recognition as sr

recognizer = sr.Recognizer()

# Read the whole uploaded file into memory as a single audio segment.
# sr.AudioFile accepts WAV, AIFF and FLAC input; other formats must be
# converted before this step.
with sr.AudioFile(input_audio) as source:
    audio = recognizer.record(source)

# Convert speech → text.
# Failures are re-raised as the same exception types, but with context:
# UnknownValueError otherwise carries no message at all.
try:
    transcribed_text = recognizer.recognize_google(audio)
except sr.UnknownValueError as exc:
    raise sr.UnknownValueError(
        f"No intelligible speech could be recognized in {input_audio!r}."
    ) from exc
except sr.RequestError as exc:
    raise sr.RequestError(
        f"Speech recognition request failed for {input_audio!r}: {exc}"
    ) from exc

print("📝 Transcribed Text:", transcribed_text)


Collecting SpeechRecognition
  Downloading speechrecognition-3.14.3-py3-none-any.whl.metadata (30 kB)
Downloading speechrecognition-3.14.3-py3-none-any.whl (32.9 MB)
   ━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 32.9/32.9 MB 31.7 MB/s eta 0:00:00
Installing collected packages: SpeechRecognition
Successfully installed SpeechRecognition-3.14.3
📝 Transcribed Text: do a sunlight Forest a curious Fox with a fluffy tail and bright glimmering eyes darted between the trees it's Tiny Paws leaving soft imprints on the mossy ground hosing to sniff a patch of wildflowers it tilted its head listening to the distant sherp of a bird as if the entire Forest were a Melody it alone could understand


In [9]:
# ==============================
# STEP 6: Generate in Your Voice
# ==============================
# Synthesize the transcribed text with the selected voice inside the
# selected project.
response = Resemble.v2.clips.create_sync(
    project_uuid,
    voice_uuid,
    transcribed_text,
    title="Converted Speech"
)

# Extract audio URL.
# A failed request carries no 'item'/'audio_src'; report the whole response
# instead of failing with an unexplained KeyError.
clip_item = response.get('item') or {}
clip_url = clip_item.get('audio_src')
if not clip_url:
    raise RuntimeError(f"Resemble did not return a clip audio URL; API response: {response}")

print("🔗 Cloned Audio URL:", clip_url)


🔗 Cloned Audio URL: https://app.resemble.ai/rails/active_storage/blobs/redirect/eyJfcmFpbHMiOnsibWVzc2FnZSI6IkJBaHBCTWlzbkE4PSIsImV4cCI6bnVsbCwicHVyIjoiYmxvYl9pZCJ9fQ==--3a9e97f7c650ca13ab920493dd31a15ebc518719/Converted+Speech.wav


In [10]:
# ==============================
# STEP 7: Download & Play Result
# ==============================
import requests
from IPython.display import Audio

# Upper bound (seconds) on waiting for the server, so the cell cannot hang forever.
DOWNLOAD_TIMEOUT_S = 60

# Download result
output_file = "cloned_voice.wav"
r = requests.get(clip_url, timeout=DOWNLOAD_TIMEOUT_S)
# Stop on 4xx/5xx instead of saving an error page under a .wav name.
r.raise_for_status()
with open(output_file, "wb") as f:
    f.write(r.content)

print("✅ Cloned audio saved as:", output_file)
# Last expression of the cell: renders an inline audio player for the file.
Audio(output_file)


✅ Cloned audio saved as: cloned_voice.wav
