In [7]:
# Installing transformers architecture
!pip install transformers

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


In [8]:
# All transformers imports used by this notebook, collected in one place
from transformers import AutoTokenizer, pipeline, set_seed

In [9]:
# Sentiment-analysis pipeline with the checkpoint pinned explicitly.
# The model name and revision are the ones the unpinned call defaulted to, so the
# behaviour is unchanged while the "no model was supplied" warning goes away.
# The pipeline is named for what it is (a classifier), leaving `text` free for input strings.
sentiment_classifier = pipeline(
    "sentiment-analysis",
    model="distilbert-base-uncased-finetuned-sst-2-english",
    revision="af0f99b",
)
sentiment_classifier(" All the faith he had had had had no effect on the outcome of his life.")

No model was supplied, defaulted to distilbert-base-uncased-finetuned-sst-2-english and revision af0f99b (https://huggingface.co/distilbert-base-uncased-finetuned-sst-2-english).
Using a pipeline without specifying a model name and revision in production is not recommended.


[{'label': 'NEGATIVE', 'score': 0.9965454936027527}]

In [10]:
# Zero-shot-classification pipeline with the checkpoint pinned explicitly.
# facebook/bart-large-mnli @ c626438 is what the unpinned call defaulted to.
zsc = pipeline(
    "zero-shot-classification",
    model="facebook/bart-large-mnli",
    revision="c626438",
)
# Score the sentence against each candidate label; the result lists the labels
# sorted by score together with the original sequence.
zsc(
    "One morning I shot an elephant in my pajamas. How he got into my pajamas I’ll never know.",
    candidate_labels=["animals", "dress", "nature", "weather"],
)

No model was supplied, defaulted to facebook/bart-large-mnli and revision c626438 (https://huggingface.co/facebook/bart-large-mnli).
Using a pipeline without specifying a model name and revision in production is not recommended.


{'sequence': 'One morning I shot an elephant in my pajamas. How he got into my pajamas I’ll never know.',
 'labels': ['animals', 'nature', 'dress', 'weather'],
 'scores': [0.9651063084602356,
  0.02169850468635559,
  0.00973573513329029,
  0.0034594836179167032]}

In [11]:
# Text-generation pipeline with the checkpoint pinned explicitly.
# gpt2 @ 6c0e608 is what the unpinned call defaulted to.
# The default gpt2 text-generation settings sample tokens, so fix the seed
# to make the generated continuation repeatable across re-runs.
set_seed(42)
text_gen = pipeline("text-generation", model="gpt2", revision="6c0e608")
# Prompt kept verbatim (spelling and trailing space included) so the model input is unchanged.
text_gen("Natural Language is a powerfull ")

No model was supplied, defaulted to gpt2 and revision 6c0e608 (https://huggingface.co/gpt2).
Using a pipeline without specifying a model name and revision in production is not recommended.
Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


[{'generated_text': "Natural Language is a powerfull vernacular. People who understand it are capable of feeling it all they want. It has been used by people for millennia. People who don't have the time to learn it have a deep appreciation of its beauty and"}]

In [16]:
# Load the bert-base-cased tokenizer (a tokenizer only, not a model) and split a sample string into tokens.
# AutoTokenizer comes from the import cell at the top of the notebook.
trans = AutoTokenizer.from_pretrained("bert-base-cased")
# NOTE: the sample is a single string that contains typographic quotes and the word "and"
# between the two sentences; they are tokenized as-is and show up as tokens in the output.
text = "I’ve been waiting for a HuggingFace course my whole life.” and “I hate this so much!"
encode_text = trans.tokenize(text)
print(encode_text)

['I', '’', 've', 'been', 'waiting', 'for', 'a', 'Hu', '##gging', '##F', '##ace', 'course', 'my', 'whole', 'life', '.', '”', 'and', '“', 'I', 'hate', 'this', 'so', 'much', '!']


In [24]:
# Convert the token strings in encode_text to their integer vocabulary ids
ids = trans.convert_tokens_to_ids(encode_text)
print(ids)


[146, 787, 1396, 1151, 2613, 1111, 170, 20164, 10932, 2271, 7954, 1736, 1139, 2006, 1297, 119, 790, 1105, 789, 146, 4819, 1142, 1177, 1277, 106]


In [25]:
# Save the tokenizer (not a model) into the local directory "on_my_system".
# save_pretrained returns a tuple of the file paths it wrote, which is printed below.
save = trans.save_pretrained("on_my_system")
print(save)

('on_my_system/tokenizer_config.json', 'on_my_system/special_tokens_map.json', 'on_my_system/vocab.txt', 'on_my_system/added_tokens.json', 'on_my_system/tokenizer.json')


In [26]:
# Decode the ids back into a string with the tokenizer.
# The result is not identical to the input text: punctuation such as ’ comes back surrounded by spaces.
decode = trans.decode(ids)
print(decode)

I ’ ve been waiting for a HuggingFace course my whole life. ” and “ I hate this so much!
