<a href="https://colab.research.google.com/github/MatteoRigoni/LLMs_Projects/blob/master/HuggingFace_Pipeline_Base_Samples.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [None]:
!pip install -q transformers datasets diffusers

In [None]:
import soundfile as f  # original alias, kept so anything relying on `f` keeps working
import soundfile as sf  # conventional alias; the audio cell calls sf.write(...)
import torch
from datasets import load_dataset
from diffusers import DiffusionPipeline
from IPython.display import Audio
from transformers import pipeline

In [None]:
# Sentiment analysis
# No model is named here, so the pipeline uses its default for this task.
classifier = pipeline(task="sentiment-analysis")
result = classifier("I hate you")
print(result)

In [None]:
# Named Entity Recognition
# aggregation_strategy="simple" merges the word pieces of one entity into a
# single span. It replaces the deprecated grouped_entities=True flag, which
# requested the same grouping but emits a deprecation warning.
ner_tagger = pipeline("ner", aggregation_strategy="simple")
result = ner_tagger("My name is Sylvain and I work at Hugging Face in Brooklyn.")
print(result)

In [None]:
# Question answering: the answer is looked up in the supplied context
question_answerer = pipeline(task="question-answering")
qa_inputs = {
    "question": "Where do I work?",
    "context": "My name is Sylvain and I work at Hugging Face in Brooklyn",
}
result = question_answerer(**qa_inputs)
print(result)

In [None]:
# Text summarization
summarizer = pipeline("summarization")
text = """In our modern, information-heavy world, processing large amounts of text efficiently is crucial. This AI-powered tool is specifically designed for professionals, students, and researchers who frequently need to extract key details from lengthy documents."""
# The input is only two sentences long. Without explicit bounds the pipeline
# uses the checkpoint's default generation lengths, which can exceed the length
# of such a short input, so the "summary" could end up longer than the source.
# Bound the output (in tokens) so it is genuinely shorter than the text.
result = summarizer(text, max_length=40, min_length=10)
print(result)

In [None]:
# Translation with an explicitly chosen checkpoint (the "fr-en" OPUS-MT model)
translator = pipeline(task="translation", model="Helsinki-NLP/opus-mt-fr-en")
french_sentence = "Ce cours est produit par Hugging Face."
result = translator(french_sentence)
print(result)

In [None]:
# Zero-shot classification: score one sentence against a list of candidate labels
# Note: this rebinds `classifier`, which the sentiment-analysis cell also assigns.
classifier = pipeline(task="zero-shot-classification")
labels = ["education", "politics", "business"]
result = classifier("This is a course about the Transformers library", candidate_labels=labels)
print(result)

In [None]:
# Text generation
# Seed PyTorch's random number generator before generating: if the pipeline
# samples tokens, re-running the notebook then reproduces the same continuation
# instead of a different one on every run.
torch.manual_seed(42)
generator = pipeline("text-generation")
result = generator("In this course, we will teach you how to use pipeline")
print(result)

In [None]:
# Image Generation

# Pick the device at runtime instead of hard-coding "cuda", so the cell does not
# crash on a runtime without a GPU. Half precision is only used on the GPU; on
# CPU the weights are loaded as float32 (expect generation to be very slow there).
device = "cuda" if torch.cuda.is_available() else "cpu"
dtype = torch.float16 if device == "cuda" else torch.float32

image_gen = DiffusionPipeline.from_pretrained(
    "stabilityai/stable-diffusion-2",
    torch_dtype=dtype,
    use_safetensors=True,
    variant="fp16",  # same weight files as before; cast to `dtype` on load
).to(device)

text = "A class of Data Scientists learning about AI, in the surreal style of Salvador Dali"
image = image_gen(prompt=text).images[0]
# Bare last expression so the notebook renders the generated image.
image

In [None]:
# Audio Generation

# Pick the device at runtime instead of hard-coding 'cuda', so the cell also
# runs (more slowly) on a CPU-only runtime.
device = "cuda" if torch.cuda.is_available() else "cpu"
synthesiser = pipeline("text-to-speech", model="microsoft/speecht5_tts", device=device)

# The model is conditioned on a speaker embedding, taken here from one row of
# the x-vector dataset. SPEAKER_INDEX selects that row; a different row is
# presumably a different voice (verify against the dataset card).
SPEAKER_INDEX = 7306
embeddings_dataset = load_dataset("Matthijs/cmu-arctic-xvectors", split="validation")
# unsqueeze(0) adds a leading dimension in front of the embedding vector.
speaker_embedding = torch.tensor(embeddings_dataset[SPEAKER_INDEX]["xvector"]).unsqueeze(0)

speech = synthesiser(
    "Hi to an artificial intelligence engineer, on the way to mastery!",
    forward_params={"speaker_embeddings": speaker_embedding},
)

# Write the waveform to disk, then embed a player for it in the notebook.
# `sf` is the soundfile module alias from the notebook's import cell.
sf.write("speech.wav", speech["audio"], samplerate=speech["sampling_rate"])
Audio("speech.wav")