In [None]:
import nltk
from nltk.tokenize import word_tokenize, sent_tokenize
from nltk import pos_tag

In [None]:
# Single-sentence sample fed to the NLTK sentence and word tokenizers.
text = (
    "Natural Language Processing allows computers "
    "to understand human language."
)

In [None]:
# Fetch the Punkt tokenizer data needed by sent_tokenize / word_tokenize.
# Older NLTK releases load the pickled 'punkt' package, while recent releases
# (3.9 and later) look for the pickle-free 'punkt_tab' package and raise
# LookupError without it. Requesting both keeps the notebook runnable on either.
nltk.download('punkt')
nltk.download('punkt_tab')

[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt.zip.


True

In [None]:
# Split the sample text into a list of sentence strings.
sentences = sent_tokenize(text)

In [None]:
# Split the same text into word-level tokens; punctuation becomes its own token.
words = word_tokenize(text)

In [None]:
# Show both tokenization results, one labelled line per result.
for caption, tokens in (("Sentences:", sentences), ("Words:", words)):
    print(caption, tokens)

Sentences: ['Natural Language Processing allows computers to understand human language.']
Words: ['Natural', 'Language', 'Processing', 'allows', 'computers', 'to', 'understand', 'human', 'language', '.']


In [None]:
# Tokenize a second, shorter sentence; these tokens are the input to POS tagging.
sample_words = word_tokenize("NLP is an interesting field.")

In [None]:
# Fetch the averaged-perceptron POS tagger model used by pos_tag.
# Older NLTK releases load 'averaged_perceptron_tagger'; recent releases
# (3.9 and later) look for 'averaged_perceptron_tagger_eng' and raise
# LookupError without it. Requesting both keeps the notebook runnable on either.
nltk.download('averaged_perceptron_tagger')
nltk.download('averaged_perceptron_tagger_eng')

[nltk_data] Downloading package averaged_perceptron_tagger to
[nltk_data]     /root/nltk_data...
[nltk_data]   Unzipping taggers/averaged_perceptron_tagger.zip.


True

In [None]:
# Tag every token with its part of speech; the result is a list of (token, tag) pairs.
pos_tags = pos_tag(sample_words)

In [None]:
# Display the (token, tag) pairs produced by the tagger.
print("Part-of-Speech Tags:", pos_tags)

Part-of-Speech Tags: [('NLP', 'NNP'), ('is', 'VBZ'), ('an', 'DT'), ('interesting', 'JJ'), ('field', 'NN'), ('.', '.')]


In [None]:
import spacy

In [None]:
# Load spaCy's small English pipeline. The en_core_web_sm model package must
# already be installed (e.g. `python -m spacy download en_core_web_sm`).
nlp = spacy.load("en_core_web_sm")

In [None]:
# Sentence used for the named-entity recognition demo.
# NOTE(review): this rebinds `text`, replacing the sentence used by the NLTK
# tokenization cells earlier in the notebook.
text = "Apple is looking to buy a startup in the UK for $1 billion."

In [None]:
# Run the spaCy pipeline over the sentence; detected entities are read from doc.ents.
doc = nlp(text)

In [None]:
# Print each detected entity's text followed by its entity label.
for ent in doc.ents:
    print(ent.text, ent.label_)

Apple ORG
UK GPE
$1 billion MONEY


## LSTM

In [None]:
import numpy as np
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Embedding, LSTM, Dense, Dropout
from tensorflow.keras.preprocessing.text import Tokenizer
from tensorflow.keras.preprocessing.sequence import pad_sequences

In [None]:
# Toy corpus: five short sentences used as the training inputs for the LSTM demo.
texts = [
    "I love natural language processing",
    "Machine learning is fascinating",
    "Deep learning models are powerful",
    "I enjoy working on NLP projects",
    "This is an excellent LSTM example",
]

In [None]:
# One target per sentence; every sample is assigned class 1.
# NOTE(review): with a single class present, the accuracy reported after
# training says nothing about whether the model can discriminate.
labels = [1] * 5

In [None]:
# Keras text tokenizer; num_words=10000 caps the vocabulary used when encoding text.
tokenizer = Tokenizer(num_words=10000)

In [None]:
# Build the tokenizer's word index from the corpus.
tokenizer.fit_on_texts(texts)

In [None]:
# Encode each sentence as a list of integer word indices.
sequences = tokenizer.texts_to_sequences(texts)

In [None]:
# Fixed length that every encoded sentence is padded (or truncated) to;
# it is also the sequence length the model is configured for.
max_length = 10

In [None]:
# Pad/truncate every encoded sentence to max_length so they stack into one 2-D array
# (pad_sequences pads with zeros at the front by default).
X = pad_sequences(sequences, maxlen=max_length)
# Targets as a NumPy array, one entry per sentence.
y = np.array(labels)

In [None]:
# Seed the Python, NumPy and TensorFlow RNGs so that weight initialisation,
# batch shuffling and dropout are repeatable on every Restart & Run All.
tf.keras.utils.set_random_seed(42)

# Empty linear stack; layers are appended in the cells that follow.
model = Sequential()

In [None]:
# Declare the input shape explicitly so the model is built up front and
# model.summary() can report output shapes and parameter counts. The
# `input_length` argument previously passed to Embedding is deprecated in
# Keras 3, where it only triggers a warning.
model.add(tf.keras.Input(shape=(max_length,)))
# input_dim matches the Tokenizer's num_words (10000) so every token index is
# in range; each token is mapped to a 128-dimensional vector.
model.add(Embedding(input_dim=10000, output_dim=128))



In [None]:
# Single LSTM layer with 128 units; return_sequences=False emits only the
# output for the final timestep rather than one output per timestep.
model.add(LSTM(128, return_sequences=False))

In [None]:
# Randomly zero 20% of the LSTM outputs during training as regularisation.
model.add(Dropout(0.2))

In [None]:
# One sigmoid unit: outputs a value in (0, 1) for binary classification.
model.add(Dense(1, activation='sigmoid'))

In [None]:
# Adam optimizer with binary cross-entropy loss (pairs with the sigmoid output);
# accuracy is tracked as an additional metric.
model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

In [None]:
# Print the layer-by-layer architecture summary.
model.summary()

In [None]:
# Train for 5 epochs. batch_size=32 exceeds the 5 available samples, so each
# epoch is a single gradient step over the whole dataset.
# The returned History object is kept so per-epoch loss/accuracy can be
# inspected later (history.history) instead of leaking its repr as cell output.
history = model.fit(X, y, epochs=5, batch_size=32)

Epoch 1/5
[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m4s[0m 4s/step - accuracy: 0.8000 - loss: 0.6904
Epoch 2/5
[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 157ms/step - accuracy: 1.0000 - loss: 0.6616
Epoch 3/5
[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 107ms/step - accuracy: 1.0000 - loss: 0.6315
Epoch 4/5
[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 133ms/step - accuracy: 1.0000 - loss: 0.5947
Epoch 5/5
[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m0s[0m 144ms/step - accuracy: 1.0000 - loss: 0.5470


<keras.src.callbacks.history.History at 0x7b6404210490>

In [None]:
# NOTE: evaluation uses the same X, y that were passed to fit, so these are
# training-set metrics, not an estimate of performance on unseen data.
loss, accuracy = model.evaluate(X, y)
print(f"Loss: {loss}, Accuracy: {accuracy}")

[1m1/1[0m [32m━━━━━━━━━━━━━━━━━━━━[0m[37m[0m [1m1s[0m 568ms/step - accuracy: 1.0000 - loss: 0.4938
Loss: 0.49375468492507935, Accuracy: 1.0
