In [1]:
#--------------------------------------------------
# EMBEDDING
#--------------------------------------------------

#python -m spacy download pt_core_news_md

import spacy

# Carregar modelo em português com embeddings
nlp = spacy.load("pt_core_news_md")

# Criar embeddings
palavra1 = nlp("rei")
palavra2 = nlp("rainha")
palavra3 = nlp("carro")

# Comparar similaridade
print("rei vs rainha:", palavra1.similarity(palavra2))
print("rei vs carro:", palavra1.similarity(palavra3))

# basicamente busca a similaridade entre as palavras, o quanto uma se agrupa a outra


rei vs rainha: 0.60012286901474
rei vs carro: 0.09075795114040375


In [4]:
#--------------------------------------------------
# TRANSFORMERS (VERSÃO ANTIGA)
#--------------------------------------------------

from transformers import pipeline

# Modelo clássico de resumo (compatível com versões antigas)
summarizer = pipeline(
    "text-generation",
    model="t5-small"
)

text = """
Artificial intelligence is transforming the world. With the help of transformer models, 
computers can now perform complex tasks like translation, summarization, and automated 
responses with high accuracy. Recent advances allow machines to understand complex contexts 
and generate coherent text. This technology is being applied in areas like customer service, 
healthcare, and education. According to research, the AI market will grow 30% annually 
over the next decade, creating new opportunities.
"""

# IMPORTANTE: prefixo "summarize:"
prompt = "summarize: " + text.replace("\n", " ")

summary = summarizer(
    prompt,
    max_length=120,
    do_sample=False,
    num_return_sequences=1
)

print("SUMMARY:", summary[0]["generated_text"])


To support symlinks on Windows, you either need to activate Developer Mode or to run Python as an administrator. In order to activate developer mode, see this article: https://docs.microsoft.com/en-us/windows/apps/get-started/enable-your-device-for-development
Loading weights: 100%|██████████| 131/131 [00:00<00:00, 1180.18it/s, Materializing param=shared.weight]                                                      
The model 'T5ForConditionalGeneration' is not supported for text-generation. Supported models are ['PeftModelForCausalLM', 'AfmoeForCausalLM', 'ApertusForCausalLM', 'ArceeForCausalLM', 'AriaTextForCausalLM', 'BambaForCausalLM', 'BartForCausalLM', 'BertLMHeadModel', 'BertGenerationDecoder', 'BigBirdForCausalLM', 'BigBirdPegasusForCausalLM', 'BioGptForCausalLM', 'BitNetForCausalLM', 'BlenderbotForCausalLM', 'BlenderbotSmallForCausalLM', 'BloomForCausalLM', 'BltForCausalLM', 'CamembertForCausalLM', 'LlamaForCausalLM', 'CodeGenForCausalLM', 'CohereForCausalLM', 'Cohere2ForCausal

SUMMARY: summarize:  Artificial intelligence is transforming the world. With the help of transformer models,  computers can now perform complex tasks like translation, summarization, and automated  responses with high accuracy. Recent advances allow machines to understand complex contexts  and generate coherent text. This technology is being applied in areas like customer service,  healthcare, and education. According to research, the AI market will grow 30% annually  over the next decade, creating new opportunities. 


In [1]:
#--------------------------------------------------
# FINE TUNING
#--------------------------------------------------
from transformers import pipeline

classificador = pipeline("sentiment-analysis", model="nlptown/bert-base-multilingual-uncased-sentiment")

frases = [
    "Este curso é excelente!",
    "Não gostei do conteúdo.",
    "Achei a explicação clara e objetiva.",
    "O conteúdo é bom, mas não foi objetivo"
]

for frase in frases:
    resultado = classificador(frase)[0]
    print(f"Frase: {frase} \nSentimento: {resultado['label']} com confiança de {resultado['score']:.2f}\n")

  from .autonotebook import tqdm as notebook_tqdm
Loading weights: 100%|██████████| 201/201 [00:00<00:00, 967.65it/s, Materializing param=classifier.weight]                                      


Frase: Este curso é excelente! 
Sentimento: 5 stars com confiança de 0.70

Frase: Não gostei do conteúdo. 
Sentimento: 1 star com confiança de 0.42

Frase: Achei a explicação clara e objetiva. 
Sentimento: 4 stars com confiança de 0.47

Frase: O conteúdo é bom, mas não foi objetivo 
Sentimento: 3 stars com confiança de 0.44

