# Inference examples

In [2]:
# Do not forget to install all dependencies first:
!pip  install -Uqq WhisperSpeech==0.8.9 webdataset

In [None]:
def is_colab() -> bool:
    """Report whether this notebook appears to be running inside Google Colab.

    Detection is done by attempting to import the `google.colab` package.

    Returns:
        True if `google.colab` can be imported, False if the import fails
        with `ImportError` (this includes `ModuleNotFoundError`).
    """
    try:
        import google.colab  # noqa: F401 -- imported only to probe for Colab
    except ImportError:
        # Only a failed import means "not Colab". Unlike a bare `except:`, this
        # lets KeyboardInterrupt/SystemExit and unrelated errors propagate.
        return False
    return True

import torch
# Fail fast with an actionable message when no CUDA device is available.
# RuntimeError is raised instead of a raw BaseException so that ordinary
# `except Exception` handlers and notebook tooling treat it as a normal error;
# it is still a BaseException subclass, so broader handlers keep working.
if not torch.cuda.is_available():
    if is_colab():
        raise RuntimeError("Please change the runtime type to GPU. In the menu: Runtime -> Change runtime type (the free T4 instance is enough)")
    raise RuntimeError("Currently the example notebook requires CUDA, make sure you are running this on a machine with a GPU.")

In [4]:
# Development convenience: load IPython's autoreload extension and switch it to
# mode 2, which re-imports edited modules before each cell is executed.
%load_ext autoreload
%autoreload 2

In [5]:
import torch
import torch.nn.functional as F

from IPython.display import Markdown, HTML

## The whole pipeline

In [None]:
# See the "7. Pipeline.ipynb" notebook for details on the Pipeline class
from whisperspeech.pipeline import Pipeline

In [None]:
# Build the pipeline from two explicitly selected checkpoints, passed as
# `t2s_ref` and `s2a_ref` (the "small" T2S and "medium" S2A v1.95 models,
# going by the reference names).
pipe = Pipeline(
    t2s_ref='whisperspeech/whisperspeech:t2s-v1.95-small-8lang.model',
    s2a_ref='whisperspeech/whisperspeech:s2a-v1.95-medium-7lang.model',
)

In [None]:
# Basic usage: generate speech for the given text with `generate_to_notebook`.
# No `lang` argument is passed, so the pipeline's default language applies
# (presumably English -- confirm in the Pipeline class).
# NOTE(review): "Lion" looks like a deliberate phonetic spelling of LAION chosen
# for pronunciation -- confirm before "correcting" it.
pipe.generate_to_notebook("""
This is the first demo of Whisper Speech, a fully open source text-to-speech model trained by Collabora and Lion on the Juwels supercomputer.
""")

In [None]:
# The model knows how to speak Polish: the text is Polish and the matching
# language code is passed explicitly via `lang='pl'`.
pipe.generate_to_notebook("""
Maria Salomea Skłodowska-Curie, polsko-francuska uczona w dziedzinach fizyki doświadczalnej i chemii fizycznej, podwójna noblistka, laureatka Nagrody Nobla z fizyki i chemii.
""", lang='pl')

In [None]:
# The model also knows how to speak German: the text is German and the matching
# language code is passed explicitly via `lang='de'`.
pipe.generate_to_notebook("""
Johannes Gutenberg gilt als Erfinder des modernen Buchdrucks mit beweglichen Metalllettern, Mobilletterndruck, und der Druckerpresse. Er wurde ca. am 24. Juni in seinem Geburtsjahr getauft. Die Verwendung von beweglichen Lettern ab 1450 revolutionierte die herkömmliche Methode der Buchproduktion, das Abschreiben von Hand, und löste in Europa eine Medienrevolution aus.
""", lang='de')

In [None]:
# The model also knows how to speak French: the text is French and the matching
# language code is passed explicitly via `lang='fr'`.
pipe.generate_to_notebook("""
Second enfant de Charles Bonaparte et Letizia Ramolino, Napoléon Bonaparte devient en 1793 général dans les armées de la Première République française, née de la Révolution, où il est notamment commandant en chef de l'armée d'Italie puis de l'armée d'Orient.
""", lang='fr')

In [None]:
# The model also knows how to speak Italian: the text is Italian and the matching
# language code is passed explicitly via `lang='it'`.
pipe.generate_to_notebook("""
Maria Montessori è stata una pedagogista, educatrice e medica italiana, internazionalmente nota per il metodo educativo che prende il suo nome, adottato in migliaia di scuole dell'infanzia, elementari, medie e superiori in tutto il mondo. Fu tra le prime donne a laurearsi in medicina in Italia.
""", lang='it')

In [None]:
# The model also knows how to speak Dutch: the text is Dutch and the matching
# language code is passed explicitly via `lang='nl'`.
pipe.generate_to_notebook("""
Meisje met de parel is een schilderij uit circa 1665-1667 van de Hollandse meester Johannes Vermeer. Het is uitgegroeid tot diens populairste schilderij. Meisje met de parel kwam in 1902 in het bezit van het Mauritshuis in Den Haag.
""", lang='nl')

In [None]:
# The model also knows how to speak Spanish: the text is Spanish and the matching
# language code is passed explicitly via `lang='es'`.
pipe.generate_to_notebook("""
Pablo Ruiz Picasso fue un pintor y escultor español, creador, junto con Georges Braque, del cubismo. Es considerado desde la génesis del siglo XX como uno de los mayores pintores que participaron en los variados movimientos artísticos que se propagaron por el mundo y ejercieron una gran influencia en otros grandes artistas de su tiempo.
""", lang='es')

In [None]:
# The model also knows how to speak Portuguese: the text is Portuguese and the
# matching language code is passed explicitly via `lang='pt'`.
# The sentence break after "Equador" was missing in the input text, which ran two
# sentences together; the period is restored so the last sentence stands on its own.
pipe.generate_to_notebook("""
Vasco da Gama foi um navegador e explorador português. Na Era dos Descobrimentos, destacou-se por ter sido o comandante dos primeiros navios a navegar da Europa à Índia, na mais longa viagem oceânica até então realizada, superior a uma volta completa ao mundo pelo Equador. No fim da vida foi, por um breve período, Vice-Rei da Índia.
""", lang='pt')

## Voice cloning

In [None]:
# Zero-shot voice cloning: give the pipeline a reference audio file through the
# `speaker` argument.
#
# `speaker` is a URL here; you can provide any URL or upload your own audio files.
# `cps=10.5` is passed as well (presumably the speaking rate in characters per
# second -- TODO confirm against the Pipeline implementation).
pipe.generate_to_notebook("""
This is the first demo of Whisper Speech, a fully open source text-to-speech model trained by Collabora and Lion on the Juwels supercomputer.
""", lang='en', cps=10.5, speaker='https://upload.wikimedia.org/wikipedia/commons/7/75/Winston_Churchill_-_Be_Ye_Men_of_Valour.ogg')

In [None]:
# Voice cloning works even better (but slower) with the HQ model.
# `Pipeline()` is called without checkpoint arguments, so it loads its built-in
# defaults (presumably the HQ checkpoints -- confirm in the Pipeline class).
# Note: this rebinds `pipe`, so later cells use this pipeline instead of the
# one created earlier in the notebook.
pipe = Pipeline()

In [None]:
# Same text and reference speaker as the earlier voice-cloning cell, generated
# with whichever pipeline is currently bound to `pipe`.
# Note that `cps=10` is used here, whereas the earlier cell uses `cps=10.5`.
pipe.generate_to_notebook("""
This is the first demo of Whisper Speech, a fully open source text-to-speech model trained by Collabora and Lion on the Juwels supercomputer.
""", lang='en', cps=10, speaker='https://upload.wikimedia.org/wikipedia/commons/7/75/Winston_Churchill_-_Be_Ye_Men_of_Valour.ogg')