In [1]:
import nltk
#nltk.download('punkt')  # Download required data

text = "Natural Language Processing is fun! Let's learn NLP."

# Word Tokenization
words = nltk.word_tokenize(text)
print("Word Tokens:", words)
# Output: ['Natural', 'Language', 'Processing', 'is', 'fun', '!', 'Let', "'s", 'learn', 'NLP', '.']

# Sentence Tokenization
sentences = nltk.sent_tokenize(text)
print("Sentence Tokens:", sentences)
# Output: ['Natural Language Processing is fun!', "Let's learn NLP."]

Word Tokens: ['Natural', 'Language', 'Processing', 'is', 'fun', '!', 'Let', "'s", 'learn', 'NLP', '.']
Sentence Tokens: ['Natural Language Processing is fun!', "Let's learn NLP."]


In [2]:
from textblob import TextBlob

blob = TextBlob("Natural Language Processing is fun! Let's learn NLP.")

# Word Tokenization
print("Word Tokens:", blob.words)
# Output: ['Natural', 'Language', 'Processing', 'is', 'fun', 'Let', "'s", 'learn', 'NLP']

# Sentence Tokenization
print("Sentence Tokens:", blob.sentences)
# Output: [Sentence("Natural Language Processing is fun!"), Sentence("Let's learn NLP.")]

Word Tokens: ['Natural', 'Language', 'Processing', 'is', 'fun', 'Let', "'s", 'learn', 'NLP']
Sentence Tokens: [Sentence("Natural Language Processing is fun!"), Sentence("Let's learn NLP.")]


In [3]:
#nltk.download('averaged_perceptron_tagger')

text = "I love coding in Python."
tokens = nltk.word_tokenize(text)
pos_tags = nltk.pos_tag(tokens)
print("POS Tags:", pos_tags)
# Output: [('I', 'PRP'), ('love', 'VBP'), ('coding', 'VBG'), ('in', 'IN'), ('Python', 'NNP'), ('.', '.')]

POS Tags: [('I', 'PRP'), ('love', 'VBP'), ('coding', 'VBG'), ('in', 'IN'), ('Python', 'NNP'), ('.', '.')]


In [4]:
blob = TextBlob("I love coding in Python.")
print("POS Tags:", blob.tags)
# Output: [('I', 'PRP'), ('love', 'VBP'), ('coding', 'VBG'), ('in', 'IN'), ('Python', 'NNP')]

POS Tags: [('I', 'PRP'), ('love', 'VBP'), ('coding', 'VBG'), ('in', 'IN'), ('Python', 'NNP')]


In [5]:
from textblob import TextBlob

text = "I hate rainy days, but I love Python!"
blob = TextBlob(text)

# Polarity (-1 to 1: Negative to Positive)
print("Sentiment Polarity:", blob.sentiment.polarity)  # Output: 0.35 (Slightly Positive)

# Subjectivity (0 to 1: Objective to Subjective)
print("Subjectivity:", blob.sentiment.subjectivity)    # Output: 0.6 (Fairly Subjective)

Sentiment Polarity: -0.08750000000000002
Subjectivity: 0.75


In [6]:
blob = TextBlob("Bonjour le monde!")
print("Translated to English:", blob.translate(to='en'))
# Output: "Hello world!"

AttributeError: 'TextBlob' object has no attribute 'translate'

In [8]:
blob = TextBlob("Natural Language Processing is a subfield of AI.")
print("Noun Phrases:", blob.noun_phrases)
# Output: ['natural language processing', 'subfield', 'ai']

Noun Phrases: ['language processing', 'ai']


In [9]:
blob = TextBlob("I lve Pythn!")
print("Corrected Text:", blob.correct())
# Output: "I love Python!"

Corrected Text: I love Myth!


In [10]:
from textblob import Word

word = Word("apple")
print("Plural:", word.pluralize())  # Output: "apples"

word = Word("boxes")
print("Singular:", word.singularize())  # Output: "box"

Plural: apples
Singular: box


In [11]:
from nltk import FreqDist

text = "apple banana apple orange banana apple"
tokens = nltk.word_tokenize(text)
freq_dist = FreqDist(tokens)

print("Frequency Distribution:", freq_dist.most_common())
# Output: [('apple', 3), ('banana', 2), ('orange', 1)]

Frequency Distribution: [('apple', 3), ('banana', 2), ('orange', 1)]


In [12]:
nltk.download('stopwords')
from nltk.corpus import stopwords

text = "This is a sample sentence showing off stopword filtration."
tokens = nltk.word_tokenize(text)

stop_words = set(stopwords.words('english'))
filtered_words = [word for word in tokens if word.lower() not in stop_words]

print("Filtered Words:", filtered_words)
# Output: ['sample', 'sentence', 'showing', 'stopword', 'filtration', '.']

Filtered Words: ['sample', 'sentence', 'showing', 'stopword', 'filtration', '.']


[nltk_data] Downloading package stopwords to
[nltk_data]     /home/learntechbyme/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


In [13]:
nltk.download('wordnet')
from nltk.corpus import wordnet

synonyms = []
for syn in wordnet.synsets("happy"):
    for lemma in syn.lemmas():
        synonyms.append(lemma.name())

print("Synonyms for 'happy':", set(synonyms))
# Output: {'felicitous', 'glad', 'happy', 'well-chosen', 'content', ...}

[nltk_data] Downloading package wordnet to
[nltk_data]     /home/learntechbyme/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!


Synonyms for 'happy': {'well-chosen', 'felicitous', 'glad', 'happy'}
