In [1]:
paragraph = """It started as just another uneventful afternoon, the kind where the sky hangs dull and gray like a curtain that forgot how to be blue. 
Out of nowhere, this beat-up ice cream truck rolled into the cul-de-sac, its jingle playing a warped, off-key melody that sounded more like a haunted lullaby than a summer tune. Kids peeked through their curtains but didn’t rush out like usual—something about the driver’s too-wide grin and mirrored sunglasses made everyone hesitate. Still, curiosity’s a powerful thing. One by one, they trickled outside, drawn like moths to a weird, sticky flame. 
But instead of ice cream, the truck was handing out little jars filled with glowing jellybeans—each one pulsing like it had a heartbeat. No one knew what would happen if you ate one, but the neighborhood would never be the same again after that day."""

In [3]:
from nltk.stem import PorterStemmer
from nltk.corpus import stopwords
import nltk

nltk.download('stopwords')

[nltk_data] Downloading package stopwords to
[nltk_data]     C:\Users\hoang\AppData\Roaming\nltk_data...
[nltk_data]   Unzipping corpora\stopwords.zip.


True

In [13]:
stopwords.words('english')

['a',
 'about',
 'above',
 'after',
 'again',
 'against',
 'ain',
 'all',
 'am',
 'an',
 'and',
 'any',
 'are',
 'aren',
 "aren't",
 'as',
 'at',
 'be',
 'because',
 'been',
 'before',
 'being',
 'below',
 'between',
 'both',
 'but',
 'by',
 'can',
 'couldn',
 "couldn't",
 'd',
 'did',
 'didn',
 "didn't",
 'do',
 'does',
 'doesn',
 "doesn't",
 'doing',
 'don',
 "don't",
 'down',
 'during',
 'each',
 'few',
 'for',
 'from',
 'further',
 'had',
 'hadn',
 "hadn't",
 'has',
 'hasn',
 "hasn't",
 'have',
 'haven',
 "haven't",
 'having',
 'he',
 "he'd",
 "he'll",
 'her',
 'here',
 'hers',
 'herself',
 "he's",
 'him',
 'himself',
 'his',
 'how',
 'i',
 "i'd",
 'if',
 "i'll",
 "i'm",
 'in',
 'into',
 'is',
 'isn',
 "isn't",
 'it',
 "it'd",
 "it'll",
 "it's",
 'its',
 'itself',
 "i've",
 'just',
 'll',
 'm',
 'ma',
 'me',
 'mightn',
 "mightn't",
 'more',
 'most',
 'mustn',
 "mustn't",
 'my',
 'myself',
 'needn',
 "needn't",
 'no',
 'nor',
 'not',
 'now',
 'o',
 'of',
 'off',
 'on',
 'once',
 'on

In [14]:
stemmer = PorterStemmer()

In [17]:
sentences = nltk.sent_tokenize(paragraph)
sentences

['It started as just another uneventful afternoon, the kind where the sky hangs dull and gray like a curtain that forgot how to be blue.',
 'Out of nowhere, this beat-up ice cream truck rolled into the cul-de-sac, its jingle playing a warped, off-key melody that sounded more like a haunted lullaby than a summer tune.',
 'Kids peeked through their curtains but didn’t rush out like usual—something about the driver’s too-wide grin and mirrored sunglasses made everyone hesitate.',
 'Still, curiosity’s a powerful thing.',
 'One by one, they trickled outside, drawn like moths to a weird, sticky flame.',
 'But instead of ice cream, the truck was handing out little jars filled with glowing jellybeans—each one pulsing like it had a heartbeat.',
 'No one knew what would happen if you ate one, but the neighborhood would never be the same again after that day.']

In [18]:
type(sentences)

list

In [19]:
## Apply Stopwords and Filter and then Stem the Words

for i in range(len(sentences)):
    words = nltk.word_tokenize(sentences[i])
    words = [stemmer.stem(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i] = ' '.join(words) # converting all words to a single sentence
sentences

['it start anoth unev afternoon , kind sky hang dull gray like curtain forgot blue .',
 'out nowher , beat-up ice cream truck roll cul-de-sac , jingl play warp , off-key melodi sound like haunt lullabi summer tune .',
 'kid peek curtain ’ rush like usual—someth driver ’ too-wid grin mirror sunglass made everyon hesit .',
 'still , curios ’ power thing .',
 'one one , trickl outsid , drawn like moth weird , sticki flame .',
 'but instead ice cream , truck hand littl jar fill glow jellybeans—each one puls like heartbeat .',
 'no one knew would happen ate one , neighborhood would never day .']

In [20]:
# test on snowballstemmer
from nltk.stem.snowball import SnowballStemmer

snowball_stemmer = SnowballStemmer("english")

In [21]:
## Apply Stopwords and Filter and then Stem the Words

for i in range(len(sentences)):
    words = nltk.word_tokenize(sentences[i])
    words = [snowball_stemmer.stem(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i] = ' '.join(words) # converting all words to a single sentence
sentences

['start anoth unev afternoon , kind sky hang dull gray like curtain forgot blue .',
 'nowher , beat-up ice cream truck roll cul-de-sac , jingl play warp , off-key melodi sound like haunt lullabi summer tune .',
 'kid peek curtain ’ rush like usual—someth driver ’ too-wid grin mirror sunglass made everyon hesit .',
 'still , curio ’ power thing .',
 'one one , trickl outsid , drawn like moth weird , sticki flame .',
 'instead ice cream , truck hand littl jar fill glow jellybeans—each one pul like heartbeat .',
 'one knew would happen ate one , neighborhood would never day .']

In [22]:
# test on WordNetLemmatizer
from nltk.stem import WordNetLemmatizer

lemmatizer = WordNetLemmatizer()

In [23]:
## Apply Stopwords and Filter and then Stem the Words

for i in range(len(sentences)):
    words = nltk.word_tokenize(sentences[i])
    words = [lemmatizer.lemmatize(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i] = ' '.join(words) # converting all words to a single sentence
sentences

['start anoth unev afternoon , kind sky hang dull gray like curtain forgot blue .',
 'nowher , beat-up ice cream truck roll cul-de-sac , jingl play warp , off-key melodi sound like haunt lullabi summer tune .',
 'kid peek curtain ’ rush like usual—someth driver ’ too-wid grin mirror sunglass made everyon hesit .',
 'still , curio ’ power thing .',
 'one one , trickl outsid , drawn like moth weird , sticki flame .',
 'instead ice cream , truck hand littl jar fill glow jellybeans—each one pul like heartbeat .',
 'one knew would happen ate one , neighborhood would never day .']