In [3]:
import nltk
from nltk.tokenize import word_tokenize
from gensim.models import Word2Vec, FastText
from glove import Corpus, Glove

# Ensure the tokenizer data used by word_tokenize is available locally.
# Older NLTK releases load the 'punkt' package, while recent releases
# (3.9+) load 'punkt_tab' instead; fetching both keeps the script working
# on either. nltk.download is a no-op for packages already up to date.
for _resource in ('punkt', 'punkt_tab'):
    nltk.download(_resource)

# Sample data: a tiny four-sentence corpus passed to every training function
# in main(). Each entry is one raw sentence; preprocess_data lowercases and
# tokenizes it before training.
toy_data = [
    "word embeddings are fascinating",
    "word2vec captures semantic relationships",
    "GloVe considers global context",
    "FastText extends Word2Vec with subword information"
]

# Function to preprocess and tokenize the data
def preprocess_data(data):
    """Lowercase and tokenize every sentence in *data*.

    Args:
        data: Iterable of sentence strings.

    Returns:
        A list with one entry per sentence, each entry being the result of
        ``word_tokenize`` applied to the lowercased sentence.
    """
    # The generator is lazy, so each sentence is lowercased right before it
    # is tokenized.
    lowered = (sentence.lower() for sentence in data)
    return list(map(word_tokenize, lowered))

# Function to train Word2Vec model
def train_word2vec(data):
    """Train a gensim Word2Vec model on the given sentences.

    Args:
        data: Iterable of raw sentence strings; tokenized via
            ``preprocess_data`` before training.

    Returns:
        The trained ``Word2Vec`` model (100-dimensional vectors, window of 5,
        ``min_count=1`` so no token is dropped, 4 worker threads).
    """
    hyperparameters = {
        "vector_size": 100,
        "window": 5,
        "min_count": 1,
        "workers": 4,
    }
    return Word2Vec(sentences=preprocess_data(data), **hyperparameters)

# Function to train GloVe model
def train_glove(data):
    """Train a GloVe model on the given sentences.

    The sentences are tokenized with ``preprocess_data``, turned into a
    co-occurrence matrix (window of 5) and used to fit 100-dimensional
    vectors for 30 epochs on 4 threads.

    Args:
        data: Iterable of raw sentence strings.

    Returns:
        The fitted ``Glove`` model with the corpus word-to-id dictionary
        attached, so ``model.dictionary[word]`` indexes ``model.word_vectors``.
    """
    tokenized_sentences = preprocess_data(data)

    # Build the word-to-id mapping and the co-occurrence matrix.
    corpus = Corpus()
    corpus.fit(tokenized_sentences, window=5)

    glove = Glove(no_components=100, learning_rate=0.05)
    glove.fit(corpus.matrix, epochs=30, no_threads=4, verbose=True)

    # Glove.fit only sees the matrix; without this call glove.dictionary
    # stays None and any word lookup (``word in glove.dictionary``) fails.
    # It has to run after fit because it checks against the fitted vectors.
    glove.add_dictionary(corpus.dictionary)
    return glove

# Function to train FastText model
def train_fasttext(data):
    tokenized_sentences = preprocess_data(data)
    model = FastText(sentences=tokenized_sentences, vector_size=100, window=5, min_count=1, workers=4)
    return model

# Main function to execute the training and display results
def main():
    """Train Word2Vec, GloVe and FastText on ``toy_data`` and print one
    example embedding from each model, in that order."""
    # --- Word2Vec ---
    w2v = train_word2vec(toy_data)
    w2v_vector = w2v.wv['word']
    print("Word2Vec Embedding for 'word':", w2v_vector)

    # --- GloVe ---
    glove = train_glove(toy_data)
    word = "glove"
    if word not in glove.dictionary:
        print(f"'{word}' not found in GloVe model.")
    else:
        # The dictionary maps a token to its row in the vector matrix.
        row = glove.dictionary[word]
        embedding = glove.word_vectors[row]
        print("GloVe Embedding for 'glove':", embedding)

    # --- FastText ---
    ft = train_fasttext(toy_data)
    ft_vector = ft.wv['fasttext']
    print("FastText Embedding for 'fasttext':", ft_vector)

# Run the demo only when executed as a script, not when imported as a module.
if __name__ == "__main__":
    main()

ModuleNotFoundError: No module named 'gensim'