In [1]:
import pandas as pd
from gensim.models import Word2Vec

# Load the pre-stemmed data from CSV and split every non-missing sentence
# into whitespace-separated tokens (one token list per sentence).
df = pd.read_csv("stemmed_data.csv")
tokenized_stemmed = [
    sentence.split()
    for sentence in df['text_stemmed_sentences'].dropna()
]

# Hyperparameter grid: every combination of vector size, context window and
# architecture. The nesting order (vector size outermost, architecture
# innermost) determines the order in which the models are trained.
parameters = [
    {'model_type': model_type, 'window': window, 'vector_size': vector_size}
    for vector_size in (100, 300)
    for window in (2, 4)
    for model_type in ('cbow', 'skipgram')
]

# Model training function
def train_word2vec_model(corpus, param, corpus_type, *, min_count=1, workers=4, epochs=10):
    """Train a Word2Vec model on ``corpus``, save it to disk and return it.

    Args:
        corpus: Tokenized sentences, passed to ``Word2Vec`` as ``sentences``.
        param: Mapping with the keys ``'model_type'`` (``'cbow'`` or
            ``'skipgram'``), ``'window'`` and ``'vector_size'``.
        corpus_type: Label for the corpus (e.g. ``"stemmed"``); used as the
            prefix of the saved file name and in the printed message.
        min_count: Forwarded to ``Word2Vec`` (default 1).
        workers: Forwarded to ``Word2Vec`` (default 4).
        epochs: Forwarded to ``Word2Vec`` (default 10).

    Returns:
        The trained ``Word2Vec`` model.

    Raises:
        KeyError: If ``param`` lacks one of the required keys.
        ValueError: If ``param['model_type']`` is neither ``'cbow'`` nor
            ``'skipgram'``.
    """
    model_type = param['model_type']
    # Reject unknown architectures up front: previously anything other than
    # 'skipgram' (e.g. a typo) silently trained CBOW and was saved under a
    # misleading file name.
    if model_type not in ('cbow', 'skipgram'):
        raise ValueError(
            f"Unknown model_type {model_type!r}; expected 'cbow' or 'skipgram'"
        )

    # gensim's ``sg`` flag: 1 selects skip-gram, 0 selects CBOW.
    sg = 1 if model_type == 'skipgram' else 0
    model = Word2Vec(
        sentences=corpus,
        vector_size=param['vector_size'],
        window=param['window'],
        sg=sg,
        min_count=min_count,
        workers=workers,
        epochs=epochs,
    )

    # The file name is relative, so the model lands in the working directory.
    model_name = f"{corpus_type}_model_{model_type}_window{param['window']}_dim{param['vector_size']}.model"
    model.save(model_name)

    # Derive the label from corpus_type instead of hard-coding "Stemmed", so
    # the message is also correct for other corpora (e.g. "lemmatized").
    label = corpus_type[:1].upper() + corpus_type[1:]
    print(f"✅ {label} model kaydedildi: {model_name}")
    return model

# Train one model per hyperparameter combination on the stemmed corpus and
# keep each trained model paired with the settings that produced it.
stemmed_models = []
for param in parameters:
    model = train_word2vec_model(
        corpus=tokenized_stemmed,
        param=param,
        corpus_type="stemmed",
    )
    stemmed_models.append((param, model))


✅ Stemmed model kaydedildi: stemmed_model_cbow_window2_dim100.model
✅ Stemmed model kaydedildi: stemmed_model_skipgram_window2_dim100.model
✅ Stemmed model kaydedildi: stemmed_model_cbow_window4_dim100.model
✅ Stemmed model kaydedildi: stemmed_model_skipgram_window4_dim100.model
✅ Stemmed model kaydedildi: stemmed_model_cbow_window2_dim300.model
✅ Stemmed model kaydedildi: stemmed_model_skipgram_window2_dim300.model
✅ Stemmed model kaydedildi: stemmed_model_cbow_window4_dim300.model
✅ Stemmed model kaydedildi: stemmed_model_skipgram_window4_dim300.model
