In [1]:
from transformers import pipeline

  from .autonotebook import tqdm as notebook_tqdm


In [23]:
classifier = pipeline('translation_en_to_de')

No model was supplied, defaulted to google-t5/t5-base and revision 686f1db (https://huggingface.co/google-t5/t5-base).
Using a pipeline without specifying a model name and revision in production is not recommended.
For now, this behavior is kept to avoid breaking backwards compatibility when padding/encoding with `truncation is True`.
- Be aware that you SHOULD NOT rely on google-t5/t5-base automatically truncating your input to 512 when padding/encoding.
- If you want to encode/pad to sequences longer than 512 you can either instantiate this tokenizer with `model_max_length` or pass `max_length` when encoding/padding.


In [24]:
res = classifier('In this tutorial, we will learn how to use the dashboards in the Grafana monitoring tool. We will also learn how to create a dashboard and add panels to it. We will also learn how to use the query editor to create queries and add them to')

In [25]:
res

[{'translation_text': 'In diesem Tutorial lernen wir, wie wir die Dashboards im Grafana Monitoring Tool verwenden, wie wir ein Dashboard erstellen und Panels hinzufügen, wie wir den Abfrageeditor verwenden, um Abfragen zu erstellen und hinzuzufügen.'}]

In [26]:
from transformers import AutoTokenizer, AutoModelForSequenceClassification

In [27]:
model_name = "distilbert-base-uncased-finetuned-sst-2-english"

In [28]:
model = AutoModelForSequenceClassification.from_pretrained(model_name)

In [29]:
tokenizer = AutoTokenizer.from_pretrained(model_name)

In [30]:
classifier = pipeline('sentiment-analysis', model=model, tokenizer=tokenizer)

In [31]:
res = classifier('I love you so much')

In [32]:
res

[{'label': 'POSITIVE', 'score': 0.9998691082000732}]

In [38]:
sequence = "Using tokenizers is easy and fun! --- \n is it? --\n explain?"

In [39]:
res = tokenizer(sequence)
res

{'input_ids': [101, 2478, 19204, 17629, 2015, 2003, 3733, 1998, 4569, 999, 1011, 1011, 1011, 2003, 2009, 1029, 1011, 1011, 4863, 1029, 102], 'attention_mask': [1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]}

In [35]:
res = tokenizer.tokenize(sequence)
res

['using', 'token', '##izer', '##s', 'is', 'easy', 'and', 'fun', '!']

In [40]:
import torch
import torch.nn.functional as F

In [41]:
X_train = ["Using tokenizers is easy and fun!", "I love you so much"]

In [42]:
res = classifier(X_train)
res

[{'label': 'POSITIVE', 'score': 0.999852180480957},
 {'label': 'POSITIVE', 'score': 0.9998691082000732}]

In [43]:
batch = tokenizer(X_train, padding=True, truncation=True, return_tensors="pt", max_length=512)

In [44]:
batch

{'input_ids': tensor([[  101,  2478, 19204, 17629,  2015,  2003,  3733,  1998,  4569,   999,
           102],
        [  101,  1045,  2293,  2017,  2061,  2172,   102,     0,     0,     0,
             0]]), 'attention_mask': tensor([[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1],
        [1, 1, 1, 1, 1, 1, 1, 0, 0, 0, 0]])}

In [46]:
with torch.no_grad():
    outputs = model(**batch)
    print(outputs)
    predictions = F.softmax(outputs.logits, dim=1)
    print(predictions)
    labels = torch.argmax(predictions, dim=1)
    print(labels)

SequenceClassifierOutput(loss=None, logits=tensor([[-4.2600,  4.5592],
        [-4.2905,  4.6509]]), hidden_states=None, attentions=None)
tensor([[1.4785e-04, 9.9985e-01],
        [1.3085e-04, 9.9987e-01]])
tensor([1, 1])


In [47]:
summarization = pipeline("summarization",model="facebook/bart-large-cnn")

In [49]:
text = """The tower is 324 metres (1,063 ft) tall, same height as an 81-storey building, and the tallest structure in Paris. Its base is square, measuring 125 metres (410 ft) on each side. During its construction, the Eiffel Tower surpassed the Washington Monument to become the tallest tower in the world, a title it held for 41 years until the Chrysler Building in New York City was finished in 1930. It was the first structure to reach a height of 300 metres. Due to the addition of a broadcasting aerial at the top of the tower in 1957, it is now taller than the Chrysler Building by 5.2 metres (17 ft). Excluding transmitters, the Eiffel Tower is the second tallest ."""
res = summarization(text, max_length=130, min_length=30, do_sample=False)
res

[{'summary_text': 'The tower is 324 metres (1,063 ft) tall, same height as an 81-storey building. Its base is square, measuring 125 metres (410 ft) on each side. It was the first structure to reach a height of 300 metres.'}]

In [1]:
from transformers import Trainer, TrainingArguments

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
training_args = TrainingArguments("test-trainer")

In [None]:
trainer = Trainer(
    model=model, args=training_args
)