In [1]:
paragraph = "Natural Language Processing (NLP) is a fascinating field within artificial intelligence that enables computers to understand, interpret, and generate human language. For instance, imagine you're having a conversation with a digital assistant like me, and you're asking about the best restaurants in your area. Using NLP, I can analyze your query, understand your preferences, and provide a curated list of top-rated eateries nearby. Moreover, NLP powers applications like sentiment analysis, where businesses can gauge customer emotions from reviews, and language translation services, breaking down language barriers and facilitating global communication. The ability of NLP to bridge the gap between human and machine communication opens up a world of possibilities, making technology more intuitive and accessible."

In [2]:
from nltk.stem import PorterStemmer

In [3]:
from nltk.corpus import stopwords

In [4]:
import nltk
nltk.download('stopwords')

[nltk_data] Downloading package stopwords to C:\Users\Dell
[nltk_data]     G5\AppData\Roaming\nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


True

In [5]:
stopwords.words('english')

['i',
 'me',
 'my',
 'myself',
 'we',
 'our',
 'ours',
 'ourselves',
 'you',
 "you're",
 "you've",
 "you'll",
 "you'd",
 'your',
 'yours',
 'yourself',
 'yourselves',
 'he',
 'him',
 'his',
 'himself',
 'she',
 "she's",
 'her',
 'hers',
 'herself',
 'it',
 "it's",
 'its',
 'itself',
 'they',
 'them',
 'their',
 'theirs',
 'themselves',
 'what',
 'which',
 'who',
 'whom',
 'this',
 'that',
 "that'll",
 'these',
 'those',
 'am',
 'is',
 'are',
 'was',
 'were',
 'be',
 'been',
 'being',
 'have',
 'has',
 'had',
 'having',
 'do',
 'does',
 'did',
 'doing',
 'a',
 'an',
 'the',
 'and',
 'but',
 'if',
 'or',
 'because',
 'as',
 'until',
 'while',
 'of',
 'at',
 'by',
 'for',
 'with',
 'about',
 'against',
 'between',
 'into',
 'through',
 'during',
 'before',
 'after',
 'above',
 'below',
 'to',
 'from',
 'up',
 'down',
 'in',
 'out',
 'on',
 'off',
 'over',
 'under',
 'again',
 'further',
 'then',
 'once',
 'here',
 'there',
 'when',
 'where',
 'why',
 'how',
 'all',
 'any',
 'both',
 'each

In [7]:
stemmer = PorterStemmer()

In [23]:
sentences = nltk.sent_tokenize(paragraph)

In [14]:
# Apply Stopwords And Filter And Then Apply Stemming

for i in range(len(sentences)):
    words = nltk.word_tokenize(sentences[i])
    words = [stemmer.stem(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i] = ' '.join(words)

In [15]:
sentences

['natur languag process ( nlp ) fascin field within artifici intellig enabl comput understand , interpret , gener human languag .',
 "instanc , imagin 're conver digit assist like , 're ask best restaur area .",
 'use nlp , analyz queri , understand prefer , provid curat list top-rat eateri nearbi .',
 'moreov , nlp power applic like sentiment analysi , busi gaug custom emot review , languag translat servic , break languag barrier facilit global commun .',
 'abil nlp bridg gap human machin commun open world possibl , make technolog intuit access .']

In [16]:
from nltk.stem import SnowballStemmer

In [17]:
snowball = SnowballStemmer('english')

In [19]:
# Apply Stopwords And Filter And Then Apply Snowball Stemming

for i in range(len(sentences)):
    words = nltk.word_tokenize(sentences[i])
    words = [snowball.stem(word) for word in words if word not in set(stopwords.words('english'))]
    sentences[i] = ' '.join(words)

In [20]:
sentences

['natur languag process ( nlp ) fascin field within artifici intellig enabl comput understand , interpret , gener human languag .',
 'instanc , imagin re conver digit assist like , re ask best restaur area .',
 'use nlp , analyz queri , understand prefer , provid curat list top-rat eateri nearbi .',
 'moreov , nlp power applic like sentiment analysi , busi gaug custom emot review , languag translat servic , break languag barrier facilit global commun .',
 'abil nlp bridg gap human machin commun open world possibl , make technolog intuit access .']

In [21]:
from nltk.stem import WordNetLemmatizer

In [22]:
lemmatizer = WordNetLemmatizer()

In [29]:
for i in range(len(sentences)):
    sentences[i] = sentences[i].lower()
    words = nltk.word_tokenize(sentences[i])
    words = [lemmatizer.lemmatize(word,pos='v') for word in words if word not in set(stopwords.words('english'))]
    sentences[i] = ' '.join(words)

In [30]:
sentences

['natural language process ( nlp ) fascinate field within artificial intelligence enable computer understand , interpret , generate human language .',
 "instance , imagine 're conversation digital assistant like , 're ask best restaurant area .",
 'use nlp , analyze query , understand preference , provide curated list top-rated eatery nearby .',
 'moreover , nlp power application like sentiment analysis , business gauge customer emotion review , language translation service , break language barrier facilitate global communication .',
 'ability nlp bridge gap human machine communication open world possibility , make technology intuitive accessible .']