In [8]:
corpus = """Good morning everyone,
Today, I don’t want to talk to you about success.
I don’t want to talk about failure either.
I want to talk to you about the space between the two — the part no one posts on LinkedIn, no one puts on Instagram, and no one applauds.
That space is called the journey.
You see, we live in a world that celebrates outcomes.
We clap for degrees, titles, salaries, rankings, followers, and results.
But we rarely talk about the nights of doubt, the confusion, the fear of being left behind, and the quiet resilience it takes to keep going when nobody is watching.
Every single person sitting here today is on a different timeline.
And yet, we constantly compare our Chapter 3 with someone else’s Chapter 20.
Let me tell you something important:
Life is not a race. It is a process.
Some people discover their purpose early.
Some discover it late.
Some change it multiple times.
None of that makes you behind.
What does put you behind is quitting on yourself because your progress doesn’t look like someone else’s highlight reel.
You will have moments where you question your abilities.
Moments where you wonder if you chose the right path.
Moments where you feel like everyone else has figured it out except you.
Let me be honest with you — most people are figuring it out as they go.
Confidence is not clarity.
Often, it’s just courage wearing a calm face.
The truth is, growth is uncomfortable.
Transformation is messy.
And progress is often invisible while it’s happening.
When you plant a seed, you don’t dig it up every day to check if it’s growing.
You water it.
You protect it.
You trust the process.
It tells you what didn’t work.
It sharpens your judgment.
It humbles your ego and strengthens your character.
The only real failure is refusing to learn.
So walk out of this room with patience for yourself.
With belief in your ability to grow.
And with the courage to continue, even when the path feels unclear.
Your story is still being written.
And the next chapter is waiting for you to show up.
Thank you."""

In [1]:
import nltk
from nltk.corpus import stopwords
nltk.download("stopwords")

[nltk_data] Downloading package stopwords to
[nltk_data]     C:\Users\anand\AppData\Roaming\nltk_data...
[nltk_data]   Unzipping corpora\stopwords.zip.


True

In [4]:
stopwords.words("english")

['a',
 'about',
 'above',
 'after',
 'again',
 'against',
 'ain',
 'all',
 'am',
 'an',
 'and',
 'any',
 'are',
 'aren',
 "aren't",
 'as',
 'at',
 'be',
 'because',
 'been',
 'before',
 'being',
 'below',
 'between',
 'both',
 'but',
 'by',
 'can',
 'couldn',
 "couldn't",
 'd',
 'did',
 'didn',
 "didn't",
 'do',
 'does',
 'doesn',
 "doesn't",
 'doing',
 'don',
 "don't",
 'down',
 'during',
 'each',
 'few',
 'for',
 'from',
 'further',
 'had',
 'hadn',
 "hadn't",
 'has',
 'hasn',
 "hasn't",
 'have',
 'haven',
 "haven't",
 'having',
 'he',
 "he'd",
 "he'll",
 'her',
 'here',
 'hers',
 'herself',
 "he's",
 'him',
 'himself',
 'his',
 'how',
 'i',
 "i'd",
 'if',
 "i'll",
 "i'm",
 'in',
 'into',
 'is',
 'isn',
 "isn't",
 'it',
 "it'd",
 "it'll",
 "it's",
 'its',
 'itself',
 "i've",
 'just',
 'll',
 'm',
 'ma',
 'me',
 'mightn',
 "mightn't",
 'more',
 'most',
 'mustn',
 "mustn't",
 'my',
 'myself',
 'needn',
 "needn't",
 'no',
 'nor',
 'not',
 'now',
 'o',
 'of',
 'off',
 'on',
 'once',
 'on

In [5]:
stopwords.words("german")

['aber',
 'alle',
 'allem',
 'allen',
 'aller',
 'alles',
 'als',
 'also',
 'am',
 'an',
 'ander',
 'andere',
 'anderem',
 'anderen',
 'anderer',
 'anderes',
 'anderm',
 'andern',
 'anderr',
 'anders',
 'auch',
 'auf',
 'aus',
 'bei',
 'bin',
 'bis',
 'bist',
 'da',
 'damit',
 'dann',
 'der',
 'den',
 'des',
 'dem',
 'die',
 'das',
 'dass',
 'daß',
 'derselbe',
 'derselben',
 'denselben',
 'desselben',
 'demselben',
 'dieselbe',
 'dieselben',
 'dasselbe',
 'dazu',
 'dein',
 'deine',
 'deinem',
 'deinen',
 'deiner',
 'deines',
 'denn',
 'derer',
 'dessen',
 'dich',
 'dir',
 'du',
 'dies',
 'diese',
 'diesem',
 'diesen',
 'dieser',
 'dieses',
 'doch',
 'dort',
 'durch',
 'ein',
 'eine',
 'einem',
 'einen',
 'einer',
 'eines',
 'einig',
 'einige',
 'einigem',
 'einigen',
 'einiger',
 'einiges',
 'einmal',
 'er',
 'ihn',
 'ihm',
 'es',
 'etwas',
 'euer',
 'eure',
 'eurem',
 'euren',
 'eurer',
 'eures',
 'für',
 'gegen',
 'gewesen',
 'hab',
 'habe',
 'haben',
 'hat',
 'hatte',
 'hatten',
 '

In [6]:
stopwords.words("french")

['au',
 'aux',
 'avec',
 'ce',
 'ces',
 'dans',
 'de',
 'des',
 'du',
 'elle',
 'en',
 'et',
 'eux',
 'il',
 'ils',
 'je',
 'la',
 'le',
 'les',
 'leur',
 'lui',
 'ma',
 'mais',
 'me',
 'même',
 'mes',
 'moi',
 'mon',
 'ne',
 'nos',
 'notre',
 'nous',
 'on',
 'ou',
 'par',
 'pas',
 'pour',
 'qu',
 'que',
 'qui',
 'sa',
 'se',
 'ses',
 'son',
 'sur',
 'ta',
 'te',
 'tes',
 'toi',
 'ton',
 'tu',
 'un',
 'une',
 'vos',
 'votre',
 'vous',
 'c',
 'd',
 'j',
 'l',
 'à',
 'm',
 'n',
 's',
 't',
 'y',
 'été',
 'étée',
 'étées',
 'étés',
 'étant',
 'étante',
 'étants',
 'étantes',
 'suis',
 'es',
 'est',
 'sommes',
 'êtes',
 'sont',
 'serai',
 'seras',
 'sera',
 'serons',
 'serez',
 'seront',
 'serais',
 'serait',
 'serions',
 'seriez',
 'seraient',
 'étais',
 'était',
 'étions',
 'étiez',
 'étaient',
 'fus',
 'fut',
 'fûmes',
 'fûtes',
 'furent',
 'sois',
 'soit',
 'soyons',
 'soyez',
 'soient',
 'fusse',
 'fusses',
 'fût',
 'fussions',
 'fussiez',
 'fussent',
 'ayant',
 'ayante',
 'ayantes',


In [34]:
from nltk.stem import PorterStemmer
stemmer = PorterStemmer()
sentences = nltk.sent_tokenize(corpus)
type(sentences)

list

In [15]:
# Apply stopwords and filter the words and then apply stemming

for i in range(len(sentences)):
  words = nltk.word_tokenize(sentences[i])
  words = [stemmer.stem(word) for word in words if word not in set(stopwords.words("english"))]
  sentences[i] = "  ".join(words) 
  

In [17]:
sentences

['good  morn  everyon  ,  today  ,  ’  want  talk  success  .',
 '’  want  talk  failur  either  .',
 'want  talk  space  two  —  part  one  post  linkedin  ,  one  put  instagram  ,  one  applaud  .',
 'space  call  journey  .',
 'see  ,  live  world  celebr  outcom  .',
 'clap  degr  ,  titl  ,  salari  ,  rank  ,  follow  ,  result  .',
 'rare  talk  night  doubt  ,  confu  ,  fear  left  behind  ,  quiet  resili  take  keep  go  nobodi  watch  .',
 'everi  singl  person  sit  today  differ  timelin  .',
 'yet  ,  constantli  compar  chapter  3  someon  el  ’  chapter  20  .',
 'let  tell  someth  import  :  life  race  .',
 'process  .',
 'peopl  discov  purpo  earli  .',
 'discov  late  .',
 'chang  multipl  time  .',
 'none  make  behind  .',
 'put  behind  quit  progress  ’  look  like  someon  el  ’  highlight  reel  .',
 'moment  question  abil  .',
 'moment  wonder  chose  right  path  .',
 'moment  feel  like  everyon  el  figur  except  .',
 'let  honest  —  peopl  figur  g

In [19]:
from nltk.stem import SnowballStemmer
snowStem = SnowballStemmer("english")

In [30]:
for i in range(len(sentences)):
  words = nltk.word_tokenize(sentences[i])
  words = [snowStem.stem(word) for word in words if word not in set(stopwords.words("english"))]
  sentences[i] = "  ".join(words)

In [31]:
sentences

['good  morn  everyon  ,  today  ,  i  ’  want  talk  success  .',
 'i  ’  want  talk  failur  either  .',
 'i  want  talk  space  two  —  part  one  post  linkedin  ,  one  put  instagram  ,  one  applaud  .',
 'that  space  call  journey  .',
 'you  see  ,  live  world  celebr  outcom  .',
 'we  clap  degre  ,  titl  ,  salari  ,  rank  ,  follow  ,  result  .',
 'but  rare  talk  night  doubt  ,  confus  ,  fear  left  behind  ,  quiet  resili  take  keep  go  nobodi  watch  .',
 'everi  singl  person  sit  today  differ  timelin  .',
 'and  yet  ,  constant  compar  chapter  3  someon  els  ’  chapter  20  .',
 'let  tell  someth  import  :  life  race  .',
 'it  process  .',
 'some  peopl  discov  purpos  earli  .',
 'some  discov  late  .',
 'some  chang  multipl  time  .',
 'none  make  behind  .',
 'what  put  behind  quit  progress  ’  look  like  someon  els  ’  highlight  reel  .',
 'you  moment  question  abil  .',
 'moment  wonder  chose  right  path  .',
 'moment  feel  l

In [23]:
from nltk.stem import WordNetLemmatizer
wnl = WordNetLemmatizer()

In [37]:
for i in range(len(sentences)):
  words = nltk.word_tokenize(sentences[i])
  words = [wnl.lemmatize(word.lower(), pos="v") for word in words if word not in set(stopwords.words("english"))]
  sentences[i] = "  ".join(words)

In [38]:
sentences

['good  morning  everyone  ,  today  ,  i  ’  want  talk  success  .',
 'i  ’  want  talk  failure  either  .',
 'i  want  talk  space  two  —  part  one  post  linkedin  ,  one  put  instagram  ,  one  applaud  .',
 'that  space  call  journey  .',
 'you  see  ,  live  world  celebrate  outcomes  .',
 'we  clap  degrees  ,  title  ,  salaries  ,  rankings  ,  followers  ,  result  .',
 'but  rarely  talk  nights  doubt  ,  confusion  ,  fear  leave  behind  ,  quiet  resilience  take  keep  go  nobody  watch  .',
 'every  single  person  sit  today  different  timeline  .',
 'and  yet  ,  constantly  compare  chapter  3  someone  else  ’  chapter  20  .',
 'let  tell  something  important  :  life  race  .',
 'it  process  .',
 'some  people  discover  purpose  early  .',
 'some  discover  late  .',
 'some  change  multiple  time  .',
 'none  make  behind  .',
 'what  put  behind  quit  progress  ’  look  like  someone  else  ’  highlight  reel  .',
 'you  moments  question  abilities