# Quick Experiment
A short test to verify that `torch`, `transformers`, and `scikit-learn` are working.

In [None]:
# Install dependencies (only needed once per environment).
# The leading `!` hands the rest of the line to the system shell from the
# notebook; `uv add` records the listed packages as dependencies of the
# current uv project and installs them.
# NOTE(review): presumably requires a uv project (pyproject.toml) in the
# working directory — confirm before running in a bare environment.
!uv add torch transformers scikit-learn pandas numpy

In [None]:
import torch
from transformers import AutoTokenizer, AutoModel
from sklearn.cluster import KMeans
import numpy as np
import pandas as pd

# Report the installed version of every library this notebook exercises.
# Each entry pairs the label to print with the importable module name.
for label, module_name in (
    ('Torch:', 'torch'),
    ('Transformers:', 'transformers'),
    ('scikit-learn:', 'sklearn'),
):
    print(label, __import__(module_name).__version__)

In [None]:
# Quick embedding experiment: embed a handful of sentences with DistilBERT,
# then cluster the embeddings with k-means as an end-to-end check that
# torch, transformers, and scikit-learn work together.
model_name = 'distilbert-base-uncased'
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModel.from_pretrained(model_name)

sentences = [
    'I love machine learning.',
    'Deep learning is amazing.',
    'Transformers are powerful.',
    'I enjoy learning about AI.',
]

# padding=True pads every sentence to the longest one in the batch, so the
# attention mask is needed below to tell real tokens from padding.
inputs = tokenizer(sentences, padding=True, truncation=True, return_tensors='pt')
with torch.no_grad():
    # Per-token hidden states; per the transformers docs the shape is
    # (batch_size, sequence_length, hidden_size).
    hidden = model(**inputs).last_hidden_state

    # Mask-aware mean pooling. A plain `.mean(dim=1)` would also average the
    # hidden states of padding positions, skewing the embeddings of the
    # shorter sentences. Zero those positions out and divide by the number
    # of real tokens instead.
    mask = inputs['attention_mask'].unsqueeze(-1).to(hidden.dtype)
    token_counts = mask.sum(dim=1).clamp(min=1)  # guard against divide-by-zero
    outputs = (hidden * mask).sum(dim=1) / token_counts

embeddings = outputs.numpy()

# Cluster embeddings to verify sklearn works. A fixed random_state keeps the
# cluster assignment reproducible across notebook runs.
km = KMeans(n_clusters=2, n_init='auto', random_state=0)
labels = km.fit_predict(embeddings)

# Last expression of the cell: rendered as a table by the notebook.
pd.DataFrame({'sentence': sentences, 'cluster': labels})