Importing the libraries and downloading the required NLTK resources.


In [None]:
# importing libraries
import nltk
from nltk.tokenize import word_tokenize
from nltk.corpus import stopwords
from nltk.stem import PorterStemmer,WordNetLemmatizer

# Download the NLTK data packages the later cells rely on.
# Each call fetches one package into the nltk_data directory.
nltk.download('punkt_tab')  # tokenizer data (unpacked under tokenizers/punkt_tab)
nltk.download('stopwords')  # stopword corpus, read later via stopwords.words('english')
nltk.download('wordnet')  # WordNet corpus; presumably the dictionary behind WordNetLemmatizer
nltk.download('omw-1.4')  # presumably the Open Multilingual Wordnet companion data for 'wordnet' — confirm it is still needed

[nltk_data] Downloading package punkt_tab to /root/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt_tab.zip.
[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Unzipping corpora/stopwords.zip.
[nltk_data] Downloading package wordnet to /root/nltk_data...
[nltk_data] Downloading package omw-1.4 to /root/nltk_data...


True

Defining the paragraph.

In [None]:
# Sample text used by every preprocessing step below. It is stored one
# sentence per entry and stitched together with single spaces.
paragraph = " ".join([
    "Technology plays a vital role in today’s world, reshaping how people work, connect, and gain knowledge.",
    "From mobile devices to artificial intelligence, innovations have greatly enhanced productivity and comfort across various industries.",
    "In education, digital platforms enable students to learn from anywhere, and in healthcare, advanced tools and data-driven diagnostics help save countless lives.",
    "Yet, the rapid rise of technology also brings challenges such as privacy risks, job displacement, and growing reliance on machines.",
    "Hence, while technology offers remarkable advantages, it must be used thoughtfully to ensure sustainable and balanced progress.",
])
print(paragraph)


Technology plays a vital role in today’s world, reshaping how people work, connect, and gain knowledge. From mobile devices to artificial intelligence, innovations have greatly enhanced productivity and comfort across various industries. In education, digital platforms enable students to learn from anywhere, and in healthcare, advanced tools and data-driven diagnostics help save countless lives. Yet, the rapid rise of technology also brings challenges such as privacy risks, job displacement, and growing reliance on machines. Hence, while technology offers remarkable advantages, it must be used thoughtfully to ensure sustainable and balanced progress.


Tokenization: splits the paragraph into individual words and punctuation marks.


In [None]:
# Break the paragraph into word and punctuation tokens, then show the list
# under a "Token" heading (heading and list are printed on separate lines).
tokens = word_tokenize(paragraph)
print("Token", tokens, sep="\n")

Token
['Technology', 'plays', 'a', 'vital', 'role', 'in', 'today', '’', 's', 'world', ',', 'reshaping', 'how', 'people', 'work', ',', 'connect', ',', 'and', 'gain', 'knowledge', '.', 'From', 'mobile', 'devices', 'to', 'artificial', 'intelligence', ',', 'innovations', 'have', 'greatly', 'enhanced', 'productivity', 'and', 'comfort', 'across', 'various', 'industries', '.', 'In', 'education', ',', 'digital', 'platforms', 'enable', 'students', 'to', 'learn', 'from', 'anywhere', ',', 'and', 'in', 'healthcare', ',', 'advanced', 'tools', 'and', 'data-driven', 'diagnostics', 'help', 'save', 'countless', 'lives', '.', 'Yet', ',', 'the', 'rapid', 'rise', 'of', 'technology', 'also', 'brings', 'challenges', 'such', 'as', 'privacy', 'risks', ',', 'job', 'displacement', ',', 'and', 'growing', 'reliance', 'on', 'machines', '.', 'Hence', ',', 'while', 'technology', 'offers', 'remarkable', 'advantages', ',', 'it', 'must', 'be', 'used', 'thoughtfully', 'to', 'ensure', 'sustainable', 'and', 'balanced', 'p

Stopword removal: removes common English words such as "is", "the", and "and", keeping only the meaningful words. Punctuation tokens are dropped as well.

In [None]:
# Build the stopword lookup once; a set makes each membership test cheap.
stop_words = set(stopwords.words('english'))

# Keep a token when it is not a stopword (compared case-insensitively) and
# consists of letters only. Hyphenated compounds such as "data-driven" are
# accepted by checking every hyphen-separated part: a plain str.isalpha()
# test rejects the hyphen and would silently drop a meaningful word.
# Pure punctuation (",", ".", "’", "-") still fails the check and is removed,
# because at least one of its parts is empty or non-alphabetic.
filtered_tokens = [
    word
    for word in tokens
    if word.lower() not in stop_words
    and all(part.isalpha() for part in word.split('-'))
]
print("after stopword removal")
print(filtered_tokens)

after stopword removal
['Technology', 'plays', 'vital', 'role', 'today', 'world', 'reshaping', 'people', 'work', 'connect', 'gain', 'knowledge', 'mobile', 'devices', 'artificial', 'intelligence', 'innovations', 'greatly', 'enhanced', 'productivity', 'comfort', 'across', 'various', 'industries', 'education', 'digital', 'platforms', 'enable', 'students', 'learn', 'anywhere', 'healthcare', 'advanced', 'tools', 'diagnostics', 'help', 'save', 'countless', 'lives', 'Yet', 'rapid', 'rise', 'technology', 'also', 'brings', 'challenges', 'privacy', 'risks', 'job', 'displacement', 'growing', 'reliance', 'machines', 'Hence', 'technology', 'offers', 'remarkable', 'advantages', 'must', 'used', 'thoughtfully', 'ensure', 'sustainable', 'balanced', 'progress']


Stemming: reduces each word to its root form, which is often not an actual word (for example, "technology" becomes "technolog").

In [None]:
# Run the Porter stemmer over every filtered token. The results are truncated
# roots rather than dictionary words.
stemmer = PorterStemmer()
stemmed_words = list(map(stemmer.stem, filtered_tokens))
print("after stemming", stemmed_words, sep="\n")

after stemming
['technolog', 'play', 'vital', 'role', 'today', 'world', 'reshap', 'peopl', 'work', 'connect', 'gain', 'knowledg', 'mobil', 'devic', 'artifici', 'intellig', 'innov', 'greatli', 'enhanc', 'product', 'comfort', 'across', 'variou', 'industri', 'educ', 'digit', 'platform', 'enabl', 'student', 'learn', 'anywher', 'healthcar', 'advanc', 'tool', 'diagnost', 'help', 'save', 'countless', 'live', 'yet', 'rapid', 'rise', 'technolog', 'also', 'bring', 'challeng', 'privaci', 'risk', 'job', 'displac', 'grow', 'relianc', 'machin', 'henc', 'technolog', 'offer', 'remark', 'advantag', 'must', 'use', 'thought', 'ensur', 'sustain', 'balanc', 'progress']


Lemmatization: reduces each word to its dictionary base form (lemma), for example "devices" becomes "device".

In [None]:
# WordNetLemmatizer.lemmatize() treats every word as a noun unless a part of
# speech is supplied, which leaves verb forms such as "brings", "reshaping"
# and "used" unchanged. Tag each token first and pass the matching WordNet
# category so those forms are reduced to their base form as well.
# The tagger model is fetched here so this cell works on its own; the call is
# a no-op once the package is already installed.
nltk.download('averaged_perceptron_tagger_eng', quiet=True)

# First letter of the Penn Treebank tag -> WordNet POS code
# (adjective, verb, adverb). Any other tag falls back to noun, which is the
# lemmatizer's own default.
TREEBANK_TO_WORDNET = {'J': 'a', 'V': 'v', 'R': 'r'}

lemmatizer = WordNetLemmatizer()
# NOTE: tags are assigned on the stopword-filtered tokens, so the tagger sees
# less context than in the original sentences and may occasionally mis-tag.
lemmatized_words = [
    lemmatizer.lemmatize(word, TREEBANK_TO_WORDNET.get(tag[:1], 'n'))
    for word, tag in nltk.pos_tag(filtered_tokens)
]
print("After lemmatization")
print(lemmatized_words)

After lemmatization
['Technology', 'play', 'vital', 'role', 'today', 'world', 'reshaping', 'people', 'work', 'connect', 'gain', 'knowledge', 'mobile', 'device', 'artificial', 'intelligence', 'innovation', 'greatly', 'enhanced', 'productivity', 'comfort', 'across', 'various', 'industry', 'education', 'digital', 'platform', 'enable', 'student', 'learn', 'anywhere', 'healthcare', 'advanced', 'tool', 'diagnostics', 'help', 'save', 'countless', 'life', 'Yet', 'rapid', 'rise', 'technology', 'also', 'brings', 'challenge', 'privacy', 'risk', 'job', 'displacement', 'growing', 'reliance', 'machine', 'Hence', 'technology', 'offer', 'remarkable', 'advantage', 'must', 'used', 'thoughtfully', 'ensure', 'sustainable', 'balanced', 'progress']
