# Hugging Face

## 이선우 (20223888)

In [1]:
from transformers import pipeline

## Sentiment Analysis

In [22]:
classifier = pipeline('sentiment-analysis')

No model was supplied, defaulted to distilbert-base-uncased-finetuned-sst-2-english (https://huggingface.co/distilbert-base-uncased-finetuned-sst-2-english)


In [23]:
text = [
    "Fly me to the moon, and let me play among the stars",
    "April is the cruellest month, breeding Lilacs out of the dead land."
]

In [24]:
classifier(text)

[{'label': 'POSITIVE', 'score': 0.9996751546859741},
 {'label': 'NEGATIVE', 'score': 0.9489613771438599}]

## Zero-shot classification

(Few-shot classification)

GPT : Generative Pre-Trained language model

In [25]:
classifier = pipeline('zero-shot-classification')

No model was supplied, defaulted to facebook/bart-large-mnli (https://huggingface.co/facebook/bart-large-mnli)


In [26]:
text = [
    "German finance minister urges EU to rein in public spending",
    "China seeks more island security pacts to boost clout in Pacific"
]

In [27]:
classifier(
    text,
    candidate_labels=[
        'education', 'politics', 'business',
        'economy', 'europe', 'asia'
    ]
)

[{'sequence': 'German finance minister urges EU to rein in public spending',
  'labels': ['europe', 'politics', 'economy', 'business', 'education', 'asia'],
  'scores': [0.40189388394355774,
   0.2552807033061981,
   0.24059978127479553,
   0.07709541916847229,
   0.016165118664503098,
   0.008965007029473782]},
 {'sequence': 'China seeks more island security pacts to boost clout in Pacific',
  'labels': ['politics', 'asia', 'business', 'economy', 'europe', 'education'],
  'scores': [0.5034076571464539,
   0.27671101689338684,
   0.14557312428951263,
   0.033448345959186554,
   0.02069881558418274,
   0.020161081105470657]}]

## Text Generation

In [28]:
generator = pipeline('text-generation')

No model was supplied, defaulted to gpt2 (https://huggingface.co/gpt2)


In [29]:
# "The Myth of Sisyphus" by Albert Camus
text = "There is but one truly serious philosophical problem, and that is suicide. Judging"

In [30]:
generator(text, max_lenght=256)

Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


[{'generated_text': 'There is but one truly serious philosophical problem, and that is suicide. Judging by what I have seen, it is an irrational problem…and one where there is a clear conflict between man and the Universe: whether it is true or not…or whether'}]

## Mask filling

In [31]:
unmasker = pipeline('fill-mask')

No model was supplied, defaulted to distilroberta-base (https://huggingface.co/distilroberta-base)


In [32]:
# Billie Eilish
text = "So you're a <mask> guy, Like it really rough guy"

In [33]:
unmasker(text)

[{'score': 0.9274505972862244,
  'token': 6744,
  'token_str': ' rough',
  'sequence': "So you're a rough guy, Like it really rough guy"},
 {'score': 0.030521560460329056,
  'token': 1828,
  'token_str': ' tough',
  'sequence': "So you're a tough guy, Like it really rough guy"},
 {'score': 0.001765676774084568,
  'token': 1099,
  'token_str': ' bad',
  'sequence': "So you're a bad guy, Like it really rough guy"},
 {'score': 0.001683201640844345,
  'token': 15455,
  'token_str': ' nasty',
  'sequence': "So you're a nasty guy, Like it really rough guy"},
 {'score': 0.0015438725240528584,
  'token': 543,
  'token_str': ' hard',
  'sequence': "So you're a hard guy, Like it really rough guy"}]

## NER (Named Entity Recognition)

In [34]:
ner = pipeline('ner')

No model was supplied, defaulted to dbmdz/bert-large-cased-finetuned-conll03-english (https://huggingface.co/dbmdz/bert-large-cased-finetuned-conll03-english)


In [35]:
text = "Steven Paul Jobs (February 24, 1955 – October 5, 2011) was an American entrepreneur, inventor, business magnate, media proprietor, and investor. He was the co-founder, chairman, and CEO of Apple; the chairman and majority shareholder of Pixar; a member of The Walt Disney Company's board of directors following its acquisition of Pixar; and the founder, chairman, and CEO of NeXT. He is widely recognized as a pioneer of the personal computer revolution of the 1970s and 1980s, along with his early business partner and fellow Apple co-founder Steve Wozniak."

In [36]:
ner(text)

[{'entity': 'I-PER',
  'score': 0.99945754,
  'index': 1,
  'word': 'Steven',
  'start': 0,
  'end': 6},
 {'entity': 'I-PER',
  'score': 0.9994562,
  'index': 2,
  'word': 'Paul',
  'start': 7,
  'end': 11},
 {'entity': 'I-PER',
  'score': 0.999501,
  'index': 3,
  'word': 'Job',
  'start': 12,
  'end': 15},
 {'entity': 'I-PER',
  'score': 0.99722654,
  'index': 4,
  'word': '##s',
  'start': 15,
  'end': 16},
 {'entity': 'I-MISC',
  'score': 0.9967591,
  'index': 18,
  'word': 'American',
  'start': 62,
  'end': 70},
 {'entity': 'I-ORG',
  'score': 0.9993734,
  'index': 45,
  'word': 'Apple',
  'start': 189,
  'end': 194},
 {'entity': 'I-ORG',
  'score': 0.9989691,
  'index': 53,
  'word': 'Pi',
  'start': 237,
  'end': 239},
 {'entity': 'I-ORG',
  'score': 0.9961754,
  'index': 54,
  'word': '##xa',
  'start': 239,
  'end': 241},
 {'entity': 'I-ORG',
  'score': 0.9993247,
  'index': 55,
  'word': '##r',
  'start': 241,
  'end': 242},
 {'entity': 'I-ORG',
  'score': 0.9991516,
  'inde

## Question answering

In [37]:
question_answerer = pipeline('question-answering')

No model was supplied, defaulted to distilbert-base-cased-distilled-squad (https://huggingface.co/distilbert-base-cased-distilled-squad)


In [38]:
question_answerer(
    context = text,
    question = "Which companies are founded by Steve Jobs?"
)

{'score': 0.45512744784355164, 'start': 189, 'end': 194, 'answer': 'Apple'}

## Summarization

In [39]:
summarizer = pipeline("summarization")

No model was supplied, defaulted to sshleifer/distilbart-cnn-12-6 (https://huggingface.co/sshleifer/distilbart-cnn-12-6)


In [40]:
summarizer(text, max_length=64)

[{'summary_text': " Steven Paul Jobs was the co-founder, chairman, and CEO of Apple . He is widely recognized as a pioneer of the personal computer revolution of the 1970s and 1980s, along with his early business partner Steve Wozniak . He was a member of The Walt Disney Company's board of directors"}]

## Translation

brew install cmake
!pip install sentencepiece

In [41]:
translator = pipeline("translation", model="Helsinki-NLP/opus-mt-en-fr")

In [42]:
translator("Hello Jieun")

[{'translation_text': 'Bonjour Jieun'}]

In [43]:
translator(text)

[{'translation_text': "Steven Paul Jobs (24 février 1955 – 5 octobre 2011) était un entrepreneur américain, inventeur, magnat des affaires, propriétaire de médias et investisseur. Il était le cofondateur, président et directeur général d'Apple; le président et actionnaire majoritaire de Pixar; un membre du conseil d'administration de la Walt Disney Company suite à son acquisition de Pixar; et le fondateur, président et chef de la direction de NeXT. Il est largement reconnu comme un pionnier de la révolution informatique personnelle des années 1970 et 1980, ainsi que son premier associé et cofondateur d'Apple Steve Wozniak."}]

In [44]:
translator = pipeline("translation", model="Helsinki-NLP/opus-mt-ko-en")

In [45]:
text = "한국산 가상화폐 루나와 테라USD(UST) 폭락으로 손실을 본 투자자들이 발행사 테라폼랩스의 권도형 최고경영자(CEO)를 고소했다."

In [46]:
translator(text)

[{'translation_text': "After losing a Korean virtual currency, Luna turusD (UST), investors filed charges against CEO's high-powered top manager for the launch service terafos."}]

## Sentiment Analysis - Korean

In [2]:
classifier = pipeline('sentiment-analysis', model='snunlp/KR-FinBert-SC')

In [3]:
text = [
    "한국산 가상화폐 루나와 테라USD(UST) 폭락으로 손실을 본 투자자들이 발행사 테라폼랩스의 권도형 최고경영자(CEO)를 고소했다.",
    "외국인, 올해 국내 주식 15조 원 순매도…삼성만 5조 원 팔았다",
    '尹, 탈원전 정상화 추진 “원전 수출 증진 위해 韓美 노력”',
]

In [4]:
classifier(text)

[{'label': 'negative', 'score': 0.9798453450202942},
 {'label': 'negative', 'score': 0.9699411988258362},
 {'label': 'positive', 'score': 0.995445728302002}]