# **POS Tagging**

In [None]:
import nltk
from nltk.tokenize import word_tokenize

# Download NLTK resources (required only once per environment).
# Older NLTK releases load 'punkt' and 'averaged_perceptron_tagger', while
# recent releases (3.9 and later) look up 'punkt_tab' and
# 'averaged_perceptron_tagger_eng' instead. Fetch both generations so that
# word_tokenize() and nltk.pos_tag() work regardless of the installed version.
nltk.download('punkt')
nltk.download('punkt_tab')
nltk.download('averaged_perceptron_tagger')
nltk.download('averaged_perceptron_tagger_eng')

[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package averaged_perceptron_tagger to
[nltk_data]     /root/nltk_data...
[nltk_data]   Package averaged_perceptron_tagger is already up-to-
[nltk_data]       date!


True

In [None]:
def pos_tagging(text):
    """Split ``text`` into word tokens and attach a part-of-speech tag to each.

    Args:
        text: The raw string to analyse.

    Returns:
        Whatever ``nltk.pos_tag`` yields for the tokens produced by
        ``word_tokenize(text)`` -- a list of ``(token, tag)`` pairs.
    """
    return nltk.pos_tag(word_tokenize(text))

In [None]:
# Example input: one short English sentence.
text = "I want to go to the park."

# Tokenize and tag the sentence with pos_tagging(), then print the tagged
# tokens it returns.
tagged_text = pos_tagging(text)
print(tagged_text)

[('I', 'PRP'), ('want', 'VBP'), ('to', 'TO'), ('go', 'VB'), ('to', 'TO'), ('the', 'DT'), ('park', 'NN'), ('.', '.')]


# **Word embeddings**

In [None]:
from gensim.models import Word2Vec
import nltk
from nltk.tokenize import word_tokenize

# Download NLTK tokenizer resources (required only once per environment).
# Older NLTK releases load 'punkt'; recent releases (3.9 and later) look up
# 'punkt_tab' instead, so fetch both to keep word_tokenize() working on
# whichever version is installed.
nltk.download('punkt')
nltk.download('punkt_tab')

[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Package punkt is already up-to-date!


True

In [None]:
def word_embeddings(sentences, vector_size=100, window=5, min_count=1, epochs=10,
                    seed=1, workers=3):
    """Train a gensim ``Word2Vec`` model on a collection of raw sentences.

    Each sentence is lowercased and split into tokens with ``word_tokenize``
    before training, so vocabulary keys in the resulting model are lowercase.

    Args:
        sentences: Iterable of sentence strings.
        vector_size: Passed to ``Word2Vec`` as ``vector_size``.
        window: Passed to ``Word2Vec`` as ``window``.
        min_count: Passed to ``Word2Vec`` as ``min_count``.
        epochs: Passed to ``Word2Vec`` as ``epochs``.
        seed: Passed to ``Word2Vec`` as ``seed``. The default matches
            gensim's own default, so existing calls behave as before.
        workers: Passed to ``Word2Vec`` as ``workers``. The default matches
            gensim's own default. Per the gensim documentation, a fully
            reproducible run needs ``workers=1`` (and a fixed
            ``PYTHONHASHSEED``) in addition to a fixed ``seed``.

    Returns:
        The trained ``Word2Vec`` model.
    """
    # Lowercase before tokenizing so "The" and "the" share one vocabulary entry.
    tokenized_sentences = [word_tokenize(sentence.lower()) for sentence in sentences]
    model = Word2Vec(
        tokenized_sentences,
        vector_size=vector_size,
        window=window,
        min_count=min_count,
        epochs=epochs,
        seed=seed,
        workers=workers,
    )
    return model

In [None]:
# Example corpus: three short sentences used as toy training data.
sentences = [
    "I want to go to the park.",
    "She enjoys reading books in the garden.",
    "The cat is sleeping on the mat."
]

# Train a Word2Vec model on the corpus using word_embeddings() with its
# default hyperparameters.
model = word_embeddings(sentences)

# Look up the learned vector for a single word. word_embeddings() lowercases
# every sentence before tokenizing, so the lookup key must be lowercase.
word_embedding = model.wv['cat']
print("Word embedding for 'cat':", word_embedding)


Word embedding for 'cat': [ 7.6983306e-03  9.1193542e-03  1.1321096e-03 -8.3294185e-03
  8.4265247e-03 -3.6914316e-03  5.7402989e-03  4.3932120e-03
  9.6893338e-03 -9.2889443e-03  9.2063379e-03 -9.2823664e-03
 -6.9066901e-03 -9.1030970e-03 -5.5502160e-03  7.3666577e-03
  9.1618039e-03 -3.3242418e-03  3.7236006e-03 -3.6290367e-03
  7.8815306e-03  5.8687106e-03 -1.5499239e-06 -3.6241789e-03
 -7.2267647e-03  4.7698859e-03  1.4596012e-03 -2.6145463e-03
  7.8351870e-03 -4.0522567e-03 -9.1507761e-03 -2.2569646e-03
  1.2432506e-04 -6.6407844e-03 -5.4887622e-03 -8.5008014e-03
  9.2301471e-03  7.4222847e-03 -3.0170722e-04  7.3647597e-03
  7.9488158e-03 -7.8362640e-04  6.6117863e-03  3.7735801e-03
  5.0829053e-03  7.2518708e-03 -4.7443109e-03 -2.1883291e-03
  8.7383558e-04  4.2336206e-03  3.3009520e-03  5.0983462e-03
  4.5866645e-03 -8.4428051e-03 -3.1860210e-03 -7.2424263e-03
  9.6759908e-03  4.9993284e-03  1.6937067e-04  4.1092434e-03
 -7.6511120e-03 -6.2980973e-03  3.0816491e-03  6.5389574e-0