Adapted from the Hugging Face Transformers pipeline tutorial: https://huggingface.co/docs/transformers/pipeline_tutorial

In [None]:
from datasets import load_dataset
from transformers import pipeline
from transformers import AutoTokenizer, AutoModelForCausalLM, AutoModelForSequenceClassification
import torch

In [None]:
# Build a text-generation pipeline. No checkpoint is named here, so the
# library picks its default model for the task.
generator = pipeline("text-generation")

In [None]:
# Feed the generator a batch of two prompts in one call; the notebook shows
# the returned generations as the cell output.
ring_verse_prompts = [
    "Three Rings for the Elven-kings under the sky, Seven for the Dwarf-lords in their halls of stone",
    "Nine for Mortal Men, doomed to die, One for the Dark Lord on his dark throne",
]
generator(ring_verse_prompts)

In [None]:
# Request two alternative continuations for a single prompt.
pooh_prompt = "when rabbit asked if he'd like honey or milk with his bread, Pooh said"
generator([pooh_prompt], num_return_sequences=2)

In [None]:
# Sentiment-analysis pipeline; no checkpoint is named, so the library's
# default model for the task is used.
classifier = pipeline(task="sentiment-analysis")

# Classify one sentence; the result is displayed as the cell output.
demo_sentence = "We are very happy to show you the 🤗 Transformers library."
classifier(demo_sentence)

In [None]:
# Score several phrases with one batched call to the sentiment classifier,
# then print each predicted label next to its score rounded to 4 places.
phrases = [
    "this really sucks",
    "i love you",
    "this is factual with no bias",
    "the quick brown fox jumped over the yellow dog",
]
results = classifier(phrases)

for result in results:
    print(f"label: {result['label']}, with score: {round(result['score'], 4)}")

In [None]:
# Rebuild the sentiment classifier around an explicitly chosen checkpoint:
# load its tokenizer and sequence-classification model, then hand both to
# the pipeline instead of relying on the task default.
model_name = "nlptown/bert-base-multilingual-uncased-sentiment"
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSequenceClassification.from_pretrained(model_name)
classifier = pipeline(
    task="sentiment-analysis",
    model=model,
    tokenizer=tokenizer,
)

# Try the new classifier on a French sentence; the result is the cell output.
french_sentence = "Nous sommes très heureux de vous présenter la bibliothèque 🤗 Transformers."
classifier(french_sentence)

In [None]:
# Rebuild the text generator on the distilgpt2 checkpoint, loading the
# causal-LM model and its tokenizer explicitly.
checkpoint = "distilgpt2"
model = AutoModelForCausalLM.from_pretrained(checkpoint)
tokenizer = AutoTokenizer.from_pretrained(checkpoint)
generator = pipeline("text-generation", model=model, tokenizer=tokenizer)

# Request two alternative continuations for a single prompt.
pooh_prompt = "when rabbit asked if he'd like honey or milk with his bread, Pooh said"
generator([pooh_prompt], num_return_sequences=2)

In [None]:
# Audio classification on one sample of the LibriSpeech demo dataset.
# Seed torch's RNG first (presumably so repeated runs give the same output).
torch.manual_seed(42)

# Select the "clean" config by keyword and pass nothing else positionally:
# load_dataset's third positional parameter is `data_dir`, not `split`, so a
# positional "validation" there would not choose a split. With no `split`
# argument the call returns a mapping keyed by split name, which the
# `ds["validation"]` lookup below relies on.
ds = load_dataset("hf-internal-testing/librispeech_asr_demo", name="clean")

# Path of the second validation example's audio file.
audio_file = ds["validation"][1]["audio"]["path"]

audio_classifier = pipeline(
    task="audio-classification",
    model="ehcalabres/wav2vec2-lg-xlsr-en-speech-emotion-recognition",
)
preds = audio_classifier(audio_file)
preds

In [None]:
# Image classification with the library's default checkpoint for the task,
# run against an image referenced by URL.
cat_image_url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/pipeline-cat-chonk.jpeg"
vision_classifier = pipeline("image-classification")
preds = vision_classifier(images=cat_image_url)

# Keep only score (rounded to 4 places) and label, in that key order.
preds = [
    {"score": round(item["score"], 4), "label": item["label"]}
    for item in preds
]
preds

In [None]:
# Visual question answering: ask one free-text question about one image.
#
# Only a single image/question pair is sent to the model. The alternatives
# live in explicit candidate tuples (instead of a chain of reassignments where
# every value but the last is silently discarded), so switching inputs is a
# matter of changing one index. The last entry of each tuple is active.
candidate_images = (
    "https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/pipeline-cat-chonk.jpeg",
    "https://content.gallup.com/origin/gallupinc/GallupSpaces/Production/Cms/TGBCMS/iy1ex3cookmf9cme5qlnxa.jpg",
    'https://media.istockphoto.com/id/1328887289/photo/happy-dog.jpg?b=1&s=170667a&w=0&k=20&c=mp3L73BC14QUuk1EQaYtZ1-wwJRW9HAffcsGZNyMy_o=',
)
candidate_questions = (
    "Where is the cat?",
    "Are these people?",
    "How many people?",
    "What is the dog wearing?",
)
image = candidate_images[-1]
question = candidate_questions[-1]

# No checkpoint is named, so the library's default model for "vqa" is used.
vqa = pipeline(task="vqa")
preds = vqa(image=image, question=question)

# Keep only score (rounded to 4 places) and answer, in that key order.
preds = [{"score": round(pred["score"], 4), "answer": pred["answer"]} for pred in preds]
preds

In [None]:
# Tokenizer round trip: for each sentence, print the tokenizer's output and
# then the text obtained by decoding its input_ids back to a string.
tokenizer = AutoTokenizer.from_pretrained("bert-base-uncased")
for sequence in (
    "In a hole in the ground there lived a hobbit.",
    "A hobbit lived in a hole in the ground",
):
    encoding = tokenizer(sequence)
    print(encoding)
    print(tokenizer.decode(encoding["input_ids"]))

In [None]:
# Load the "train" split of the "en-US" configuration of PolyAI/minds14.
dataset = load_dataset(
    "PolyAI/minds14",
    name="en-US",
    split="train",
)

In [None]:
# Inspect the shape of the `array` field in the first example's audio entry.
first_example = dataset[0]
first_example["audio"]["array"].shape