In [None]:
import gensim
import numpy as np
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score

# Load pre-trained Word2Vec embeddings from a file stored in the binary
# word2vec format (binary=True).
# NOTE(review): 'path_to_word2vec.bin' looks like a placeholder path — point it
# at a real embeddings file before running.
word2vec_model = gensim.models.KeyedVectors.load_word2vec_format('path_to_word2vec.bin', binary=True)

# Simulate an NLP dataset for text classification: four short sentences and a
# parallel list of integer labels (texts[i] goes with labels[i]).
# Judging by the sentences, 1 appears to mean positive and 0 negative sentiment.
texts = ["this is a positive example", "negative sentiment here", "a very positive review", "not good at all"]
labels = [1, 0, 1, 0]

# Tokenize and represent text as the mean of word vectors
def document_vectorizer(doc, model):
    """Embed a document as the average of its in-vocabulary word vectors.

    The document is split on whitespace and every token that ``model``
    contains is looked up; tokens the model does not contain are skipped.

    Args:
        doc: The text to embed.
        model: An embedding lookup supporting ``token in model``,
            ``model[token]`` and a ``vector_size`` attribute.

    Returns:
        The element-wise mean of the found word vectors, or a zero vector of
        length ``model.vector_size`` when no token is found in the model.
    """
    known_vectors = []
    for token in doc.split():
        if token in model:
            known_vectors.append(model[token])

    if known_vectors:
        return np.mean(known_vectors, axis=0)
    # Nothing to average: fall back to an all-zero embedding.
    return np.zeros(model.vector_size)

# Build the feature matrix (one document_vectorizer output per text) and the
# matching label array.
X = np.array([document_vectorizer(text, word2vec_model) for text in texts])
y = np.array(labels)

# Split the data into training and testing sets (20% held out, fixed seed so
# the split is reproducible).
# NOTE: with only four samples the held-out set is a single example, so the
# reported accuracy can only be 0.0 or 1.0.
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)

# Train a simple logistic regression classifier on the averaged pre-trained
# embeddings (the embeddings themselves are not fine-tuned in this script)
classifier = LogisticRegression()
classifier.fit(X_train, y_train)

# Make predictions on the held-out set and evaluate the model
y_pred = classifier.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")
