In [None]:
! pip install -q transformers

[K     |████████████████████████████████| 4.0 MB 38.2 MB/s 
[K     |████████████████████████████████| 77 kB 7.8 MB/s 
[K     |████████████████████████████████| 895 kB 72.1 MB/s 
[K     |████████████████████████████████| 596 kB 88.4 MB/s 
[K     |████████████████████████████████| 6.6 MB 64.2 MB/s 
[?25h

In [12]:
# sentiment-analysis
from transformers import pipeline
classifier = pipeline("sentiment-analysis") # distilbert-base-uncased-finetuned-sst-2-english (default)
classifier(["I've been waiting for a Hugging Face course since many months","I don't hate it"])

No model was supplied, defaulted to distilbert-base-uncased-finetuned-sst-2-english (https://huggingface.co/distilbert-base-uncased-finetuned-sst-2-english)


[{'label': 'POSITIVE', 'score': 0.9690589308738708},
 {'label': 'POSITIVE', 'score': 0.9967384934425354}]

In [3]:
# The zero-shot-classification pipeline lets us select the labels for classification
from transformers import pipeline
classifier = pipeline("zero-shot-classification")  # facebook/bart-large-mnli (default)

classifier("This is a course about the Transformers library", candidate_labels=["education", "politics", "business"],)

No model was supplied, defaulted to facebook/bart-large-mnli (https://huggingface.co/facebook/bart-large-mnli)


{'labels': ['education', 'business', 'politics'],
 'scores': [0.8445995450019836, 0.111973837018013, 0.043426647782325745],
 'sequence': 'This is a course about the Transformers library'}

In [4]:
from transformers import pipeline
generator = pipeline("text-generation")
generator("In this course, we will teach you how to")

No model was supplied, defaulted to gpt2 (https://huggingface.co/gpt2)
Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


[{'generated_text': "In this course, we will teach you how to make a real-valued stock for the value of both your investment in it and the market's value.\n\nHow to Make a Realvalued Stock\n\nOn each day, I will teach you"}]

In [5]:
from transformers import pipeline
generator = pipeline("text-generation", model="distilgpt2")

generator("In this course, we will teach you how to",
  max_length=30, # Max length of generated sentences
  num_return_sequences=2) # number of sentences to be generated

Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


[{'generated_text': 'In this course, we will teach you how to control your own body, body. For example, if you are eating a good salad, it will'},
 {'generated_text': 'In this course, we will teach you how to use the technology we are getting ready to run in your community.\n\n\nAs part of our'}]

In [6]:
from transformers import pipeline
unmasker = pipeline("fill-mask")

unmasker("My <mask> is Vaasu", top_k=2) # Generating text by guessing the next word is one of the pre trained objective

No model was supplied, defaulted to distilroberta-base (https://huggingface.co/distilroberta-base)


[{'score': 0.6784117221832275,
  'sequence': 'My name is Vaasu',
  'token': 766,
  'token_str': ' name'},
 {'score': 0.0907612144947052,
  'sequence': 'My nickname is Vaasu',
  'token': 17911,
  'token_str': ' nickname'}]

In [11]:
#  The NER pipeline identifies entities such as persons, organizations or locations in a sentence.

from transformers import pipeline
ner = pipeline("ner", grouped_entities=True) # Name Entity Recognition

ner("My name is Sylvain and I work at Hugging Face in Brooklyn.")

# My name is Sylvain(PERSON) and I work at Hugging Face(ORGANIZAION) in Brooklyn(LOCATION).

No model was supplied, defaulted to dbmdz/bert-large-cased-finetuned-conll03-english (https://huggingface.co/dbmdz/bert-large-cased-finetuned-conll03-english)
  f'`grouped_entities` is deprecated and will be removed in version v5.0.0, defaulted to `aggregation_strategy="{aggregation_strategy}"` instead.'


[{'end': 18,
  'entity_group': 'PER',
  'score': 0.9981694,
  'start': 11,
  'word': 'Sylvain'},
 {'end': 45,
  'entity_group': 'ORG',
  'score': 0.9796019,
  'start': 33,
  'word': 'Hugging Face'},
 {'end': 57,
  'entity_group': 'LOC',
  'score': 0.9932106,
  'start': 49,
  'word': 'Brooklyn'}]

In [8]:
from transformers import pipeline
summarizer = pipeline("summarization")
summarizer('''
America has changed dramatically during recent years. Not only has the number of
graduates in traditional engineering disciplines such as mechanical, civil,
electrical, chemical, and aeronautical engineering declined, but in most of
the premier American universities engineering curricula now concentrate on
and encourage largely the study of engineering science. As a result, there
are declining offerings in engineering subjects dealing with infrastructure,
the environment, and related issues, and greater concentration on high
technology subjects, largely supporting increasingly complex scientific
developments. While the latter is important, it should not be at the expense
of more traditional engineering.
Rapidly developing economies such as China and India, as well as other
industrial countries in Europe and Asia, continue to encourage and advance
the teaching of engineering. Both China and India, respectively, graduate
six and eight times as many traditional engineers as does the United States.
Other industrial countries at minimum maintain their output, while America
suffers an increasingly serious decline in the number of engineering graduates
and a lack of well-educated engineers.
''')

No model was supplied, defaulted to sshleifer/distilbart-cnn-12-6 (https://huggingface.co/sshleifer/distilbart-cnn-12-6)


[{'summary_text': ' America has changed dramatically during recent years . The number of engineering graduates in the U.S. has declined in traditional engineering disciplines such as mechanical, civil, electrical, chemical, and aeronautical engineering . Rapidly developing economies such as China and India, as well as other industrialized countries, continue to encourage and advance the teaching of engineering .'}]

In [22]:
! pip install -q datasets transformers[sentencepiece]



In [None]:
!pip install sentencepiece

In [9]:
from transformers import pipeline

translator = pipeline("translation", model="Helsinki-NLP/opus-mt-fr-en") # needs sentencepiece

translator("Ce cours est produit par Hugging Face.") #restart enviroment will work

[{'translation_text': 'This course is produced by Hugging Face.'}]