# About this notebook
This is an example notebook for the Nectar AI-Ready LLM image.

This image contains the following pre-installed libraries:
- datasets
- matplotlib
- nltk
- numpy
- pandas
- plotly
- regex
- rouge_score
- safetensors
- scikit-learn
- seaborn
- torch
- tqdm
- transformers[torch]
- wordcloud
- textblob
- gensim
- sentencepiece
- sentence-transformers

# Import Libraries

In [None]:
import nltk
from sklearn.datasets import fetch_20newsgroups
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.naive_bayes import MultinomialNB
from sklearn.pipeline import make_pipeline
from transformers import pipeline

# Fetch NLTK's 'punkt' resource up front. None of the cells shown in this
# notebook use it directly; presumably it is pre-fetched for NLTK-based
# tokenisation in follow-on work — confirm before removing.
nltk.download('punkt')


# Text Classification with Scikit-learn

In [None]:
# Fetch the training split, restricted to the two newsgroups of interest
categories = ['sci.space', 'rec.sport.baseball']
data = fetch_20newsgroups(subset='train', categories=categories)
X = data.data
y = data.target

# Bag-of-words counts feeding a multinomial Naive Bayes classifier;
# fit() returns the fitted pipeline, so it can be assigned directly
model = make_pipeline(CountVectorizer(), MultinomialNB()).fit(X, y)

# Classify one unseen sentence and map the numeric label back to its name
sample_text = ["NASA announced a new mission to Mars."]
predicted_category = model.predict(sample_text)
predicted_name = data.target_names[predicted_category[0]]
print(f"Predicted Category: {predicted_name}")

# Text Generation with Hugging Face Transformers

In [None]:
# Build a text-generation pipeline backed by the GPT-2 checkpoint
generator = pipeline("text-generation", model="gpt2")
prompt = "Artificial Intelligence is transforming the world"

# Cap the output with `max_new_tokens` rather than `max_length`: `max_length`
# also counts the prompt tokens and is overridden whenever `max_new_tokens` is
# set as well, so it is an unreliable way to bound the continuation.
# GPT-2 ships without a padding token, so the end-of-sequence id is passed
# explicitly as `pad_token_id` instead of leaving generate() to fall back to it
# with a warning.
result = generator(
    prompt,
    max_new_tokens=50,
    num_return_sequences=1,
    pad_token_id=generator.tokenizer.eos_token_id,
)

# Each returned item is a dict; 'generated_text' holds prompt + continuation
print(result[0]['generated_text'])


# Sentiment Analysis

In [None]:
# Name the checkpoint explicitly instead of relying on the pipeline's implicit
# default: the library warns against unspecified models, and pinning keeps the
# demo's results stable if that default ever changes.
# NOTE(review): this is believed to be the checkpoint the "sentiment-analysis"
# task currently falls back to — confirm against the installed transformers.
sentiment_analyzer = pipeline(
    "sentiment-analysis",
    model="distilbert/distilbert-base-uncased-finetuned-sst-2-english",
)

text = "I love how easy machine learning has become with modern libraries!"
# The pipeline returns a list with one dict per input; each dict carries
# a 'label' and a 'score'
result = sentiment_analyzer(text)

print(f"Text: {text}")
print(f"Sentiment: {result[0]['label']}, Confidence: {result[0]['score']:.2f}")

# Remove cache files

In [None]:
# Uncomment the line below to delete the Hugging Face hub cache
# (downloaded models will have to be fetched again on next use)
# !rm -rf ~/.cache/huggingface/hub