In [None]:
!pip -q install -U transformers accelerate sentencepiece

In [None]:
import tensorflow as tf, torch

print("TF version:", tf.__version__)
print("TF GPU:", tf.config.list_physical_devices("GPU"))
print("Torch version:", torch.__version__)
print("Torch CUDA available:", torch.cuda.is_available())

TF version: 2.19.0
TF GPU: [PhysicalDevice(name='/physical_device:GPU:0', device_type='GPU')]
Torch version: 2.9.0+cu126
Torch CUDA available: True


In [None]:
from transformers import pipeline

clf = pipeline("sentiment-analysis")
# 기본 모델 자동 선택(환경/버전에 따라 달라질 수 있음)

texts = [
    "I love this movie!",
    "This is terrible.",
    "It is okay, not bad."
]

out = clf(texts)
for t, r in zip(texts, out):
    print(t, "->", r)

No model was supplied, defaulted to distilbert/distilbert-base-uncased-finetuned-sst-2-english and revision 714eb0f (https://huggingface.co/distilbert/distilbert-base-uncased-finetuned-sst-2-english).
Using a pipeline without specifying a model name and revision in production is not recommended.
The secret `HF_TOKEN` does not exist in your Colab secrets.
To authenticate with the Hugging Face Hub, create a token in your settings tab (https://huggingface.co/settings/tokens), set it as secret in your Google Colab and restart your session.
You will be able to reuse this secret in all of your notebooks.
Please note that authentication is recommended but still optional to access public models or datasets.


config.json:   0%|          | 0.00/629 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/268M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]

vocab.txt: 0.00B [00:00, ?B/s]

Device set to use cuda:0


I love this movie! -> {'label': 'POSITIVE', 'score': 0.9998775720596313}
This is terrible. -> {'label': 'NEGATIVE', 'score': 0.9996345043182373}
It is okay, not bad. -> {'label': 'POSITIVE', 'score': 0.9997650980949402}


In [None]:
from transformers import pipeline

translator = pipeline("translation", model="Helsinki-NLP/opus-mt-ko-en")

text = "저는 콜랩에서 허깅페이스를 실행하고 있어요."
print(translator(text, max_length=64))

config.json: 0.00B [00:00, ?B/s]

pytorch_model.bin:   0%|          | 0.00/312M [00:00<?, ?B/s]

generation_config.json:   0%|          | 0.00/293 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/312M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/44.0 [00:00<?, ?B/s]

source.spm:   0%|          | 0.00/842k [00:00<?, ?B/s]

target.spm:   0%|          | 0.00/813k [00:00<?, ?B/s]

vocab.json: 0.00B [00:00, ?B/s]

Device set to use cuda:0


[{'translation_text': "I'm running a Huggingspace at the Collab."}]


In [None]:
from transformers import pipeline

summ = pipeline("summarization")

doc = (
    "Hugging Face provides open-source tools and models for natural language processing and more. "
    "It enables quick prototyping with pipelines, supports fine-tuning on custom datasets, and "
    "offers an ecosystem including model hub, datasets, and spaces for demos."
)

print(summ(doc, max_length=40, min_length=15))

No model was supplied, defaulted to sshleifer/distilbart-cnn-12-6 and revision a4f8f3e (https://huggingface.co/sshleifer/distilbart-cnn-12-6).
Using a pipeline without specifying a model name and revision in production is not recommended.


config.json: 0.00B [00:00, ?B/s]

pytorch_model.bin:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.22G [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/26.0 [00:00<?, ?B/s]

vocab.json: 0.00B [00:00, ?B/s]

merges.txt: 0.00B [00:00, ?B/s]

Device set to use cuda:0


[{'summary_text': ' Hugging Face provides open-source tools and models for natural language processing and more . It enables quick prototyping with pipelines, supports fine-tuning on custom datasets, and offers an'}]


In [None]:
from transformers import pipeline

ner = pipeline("ner", grouped_entities=True)
print(ner("Apple is looking at buying U.K. startup for $1 billion."))

No model was supplied, defaulted to dbmdz/bert-large-cased-finetuned-conll03-english and revision 4c53496 (https://huggingface.co/dbmdz/bert-large-cased-finetuned-conll03-english).
Using a pipeline without specifying a model name and revision in production is not recommended.


config.json:   0%|          | 0.00/998 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/1.33G [00:00<?, ?B/s]

Some weights of the model checkpoint at dbmdz/bert-large-cased-finetuned-conll03-english were not used when initializing BertForTokenClassification: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight']
- This IS expected if you are initializing BertForTokenClassification from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForTokenClassification from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).


tokenizer_config.json:   0%|          | 0.00/60.0 [00:00<?, ?B/s]

vocab.txt: 0.00B [00:00, ?B/s]

Device set to use cuda:0


[{'entity_group': 'ORG', 'score': np.float32(0.9990897), 'word': 'Apple', 'start': 0, 'end': 5}, {'entity_group': 'LOC', 'score': np.float32(0.999718), 'word': 'U', 'start': 27, 'end': 28}, {'entity_group': 'LOC', 'score': np.float32(0.9987226), 'word': 'K', 'start': 29, 'end': 30}]




In [None]:
from transformers import pipeline

qa = pipeline("question-answering")

result = qa(
    question="Where do I live?",
    context="My name is Sarah and I live in London."
)
print(result)

No model was supplied, defaulted to distilbert/distilbert-base-cased-distilled-squad and revision 564e9b5 (https://huggingface.co/distilbert/distilbert-base-cased-distilled-squad).
Using a pipeline without specifying a model name and revision in production is not recommended.


config.json:   0%|          | 0.00/473 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/261M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/49.0 [00:00<?, ?B/s]

vocab.txt: 0.00B [00:00, ?B/s]

tokenizer.json: 0.00B [00:00, ?B/s]

Device set to use cuda:0


{'score': 0.9736034870147705, 'start': 31, 'end': 37, 'answer': 'London'}


In [None]:
from transformers import pipeline

gen = pipeline("text-generation", model="gpt2")
print(gen("Today I learned that", max_new_tokens=30)[0]["generated_text"])

config.json:   0%|          | 0.00/665 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/548M [00:00<?, ?B/s]

generation_config.json:   0%|          | 0.00/124 [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/26.0 [00:00<?, ?B/s]

vocab.json:   0%|          | 0.00/1.04M [00:00<?, ?B/s]

merges.txt:   0%|          | 0.00/456k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/1.36M [00:00<?, ?B/s]

Device set to use cuda:0
Setting `pad_token_id` to `eos_token_id`:50256 for open-end generation.


Today I learned that the United States government has the capability to intervene in countries that don't think they can do everything that we can to prevent the spread of terrorism. We


In [None]:
from transformers import pipeline

fm = pipeline("fill-mask", model="bert-base-uncased")
out = fm("Paris is the [MASK] of France.")
for o in out:
    print(o["sequence"], "score=", round(o["score"], 4))

config.json:   0%|          | 0.00/570 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/440M [00:00<?, ?B/s]

Some weights of the model checkpoint at bert-base-uncased were not used when initializing BertForMaskedLM: ['bert.pooler.dense.bias', 'bert.pooler.dense.weight', 'cls.seq_relationship.bias', 'cls.seq_relationship.weight']
- This IS expected if you are initializing BertForMaskedLM from the checkpoint of a model trained on another task or with another architecture (e.g. initializing a BertForSequenceClassification model from a BertForPreTraining model).
- This IS NOT expected if you are initializing BertForMaskedLM from the checkpoint of a model that you expect to be exactly identical (initializing a BertForSequenceClassification model from a BertForSequenceClassification model).


tokenizer_config.json:   0%|          | 0.00/48.0 [00:00<?, ?B/s]

vocab.txt:   0%|          | 0.00/232k [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/466k [00:00<?, ?B/s]

Device set to use cuda:0


paris is the capital of france. score= 0.9969
paris is the heart of france. score= 0.0006
paris is the center of france. score= 0.0004
paris is the centre of france. score= 0.0003
paris is the city of france. score= 0.0003


In [None]:
from transformers import pipeline

zs = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")

text = "오늘은 딥러닝 CNN 모델을 학습했어."
labels = ["sports", "technology", "cooking", "finance"]

print(zs(text, candidate_labels=labels))

config.json: 0.00B [00:00, ?B/s]

model.safetensors:   0%|          | 0.00/1.63G [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/26.0 [00:00<?, ?B/s]

vocab.json: 0.00B [00:00, ?B/s]

merges.txt: 0.00B [00:00, ?B/s]

tokenizer.json: 0.00B [00:00, ?B/s]

Device set to use cuda:0


{'sequence': '오늘은 딥러닝 CNN 모델을 학습했어.', 'labels': ['cooking', 'technology', 'sports', 'finance'], 'scores': [0.37041088938713074, 0.25491923093795776, 0.25371429324150085, 0.12095552682876587]}


In [None]:
from sentence_transformers import SentenceTransformer, util

m = SentenceTransformer("sentence-transformers/paraphrase-multilingual-MiniLM-L12-v2")

s1 = "딥러닝 모델 배포 방법을 알려줘"
s2 = "머신러닝 서비스를 운영 환경에 배포하는 방법은?"
s3 = "오늘 점심 뭐 먹지?"

emb = m.encode([s1, s2, s3], convert_to_tensor=True)
sim12 = util.cos_sim(emb[0], emb[1]).item()
sim13 = util.cos_sim(emb[0], emb[2]).item()

print("sim(s1, s2) =", round(sim12, 4))
print("sim(s1, s3) =", round(sim13, 4))

modules.json:   0%|          | 0.00/229 [00:00<?, ?B/s]

config_sentence_transformers.json:   0%|          | 0.00/122 [00:00<?, ?B/s]

README.md: 0.00B [00:00, ?B/s]

sentence_bert_config.json:   0%|          | 0.00/53.0 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/645 [00:00<?, ?B/s]

model.safetensors:   0%|          | 0.00/471M [00:00<?, ?B/s]

tokenizer_config.json:   0%|          | 0.00/480 [00:00<?, ?B/s]

tokenizer.json:   0%|          | 0.00/9.08M [00:00<?, ?B/s]

special_tokens_map.json:   0%|          | 0.00/239 [00:00<?, ?B/s]

config.json:   0%|          | 0.00/190 [00:00<?, ?B/s]

sim(s1, s2) = 0.203
sim(s1, s3) = 0.4881


In [None]:
!wget -q https://huggingface.co/datasets/huggingface/documentation-images/resolve/main/coco_sample.png -O sample.png

In [None]:
from transformers import pipeline

imgclf = pipeline("image-classification", model="google/vit-base-patch16-224")
print(imgclf("sample.png")[:3])

Fast image processor class <class 'transformers.models.vit.image_processing_vit_fast.ViTImageProcessorFast'> is available for this model. Using slow image processor class. To use the fast image processor class set `use_fast=True`.
Device set to use cuda:0


[{'label': 'Egyptian cat', 'score': 0.9374414682388306}, {'label': 'tabby, tabby cat', 'score': 0.03844264894723892}, {'label': 'tiger cat', 'score': 0.01441141590476036}]


In [None]:
from transformers import pipeline

zs = pipeline("zero-shot-classification", model="facebook/bart-large-mnli")

text = "오늘은 딥러닝 CNN 모델을 학습했어."
labels = ["AI", "sports", "movie", "travel"]

print(zs(text, candidate_labels=labels))

Device set to use cuda:0


{'sequence': '오늘은 딥러닝 CNN 모델을 학습했어.', 'labels': ['movie', 'travel', 'sports', 'AI'], 'scores': [0.4336470663547516, 0.33403483033180237, 0.1401580572128296, 0.09216004610061646]}


In [None]:
from transformers import pipeline

summ = pipeline("summarization")
clf = pipeline("sentiment-analysis")

doc = (
    "Hugging Face provides open-source tools and models for natural language processing and more. "
    "It enables quick prototyping with pipelines, supports fine-tuning on custom datasets, and "
    "offers an ecosystem including model hub, datasets, and spaces for demos."
)

print(summ(doc, max_length=100, min_length=50))

In [None]:
from transformers import pipeline

translator = pipeline("translation", model="Helsinki-NLP/opus-mt-ko-en")
summ = pipeline("summarization")

text = "전국철도노동조합(철도노조)이 23일 오전 9시부터 무기한 총파업에 돌입하겠다고 예고했다. 한국철도공사(코레일)은 파업이 시작되면 수도권 전철과 지방 광역전철 전반에서 평시 대비 25% 감축 운행이 불가피할 것으로 전망했다.철도노조는 23일로 예고한 총파업을 하루 앞두고 “노동조합의 명운을 걸고 싸우겠다”며 전국의 각 지부 조직을 점검 중이라고 22일 밝혔다. 1만2000여명의 파업 참여가 예상되며, 근무 인원의 경우에도 시간외·휴일근로를 전면 거부하는 준법 투쟁에 돌입한다.파업 시 예상되는 노선별 평시 대비 운행률은 수도권 전철 75.4%(출근 시간대 90% 이상), 경강선 73%(출근 89.5%), 대경선 76.3%(출근 78.6%), 동해선 70.3%(출근 78.6%), 경의중앙선 74%(출근 90.6%) 수준이다."
result = translator(text, max_length=64)
trans = result[0]['translation_text']

sum = summ(trans, max_length=64, min_length=15)
print(sum[0]['summary_text'])

Device set to use cuda:0
No model was supplied, defaulted to sshleifer/distilbart-cnn-12-6 and revision a4f8f3e (https://huggingface.co/sshleifer/distilbart-cnn-12-6).
Using a pipeline without specifying a model name and revision in production is not recommended.
Device set to use cuda:0
Your input_length: 248 is bigger than 0.9 * max_length: 64. You might consider increasing your max_length manually, e.g. translator('...', max_length=400)
Your max_length is set to 64, but your input_length is only 60. Since this is a summarization task, where outputs shorter than the input are typically wanted, you might consider decreasing max_length manually, e.g. summarizer('...', max_length=30)


 The National Railways Union (Cyress) has predicted a total strike of arms since 9:00 a.m. on 23 a .m., and the Korean Railway has predicted that the strike will require 25 percent reductions in water power .
