**Step 1: Install NLTK Library**

In [None]:
!pip install nltk



**Step 2: Import Required Libraries**

In [None]:
import nltk
from nltk.stem import PorterStemmer, WordNetLemmatizer
from nltk.corpus import wordnet
from nltk.tokenize import word_tokenize

**Step 3: Download NLTK Resources**

In [None]:
# Recent NLTK releases look up the tokenizer and tagger models under the
# 'punkt_tab' / 'averaged_perceptron_tagger_eng' names, while older releases
# use the original names. Requesting both keeps word_tokenize() and pos_tag()
# working with whichever NLTK version the unpinned install resolves to.
# nltk.download() reports a failed download and returns False instead of
# raising, so the extra names are harmless where they are not needed.
nltk.download('punkt_tab')
nltk.download('averaged_perceptron_tagger_eng')

# Original resources; kept last so the cell's displayed result is unchanged.
nltk.download('punkt')
nltk.download('wordnet')
nltk.download('averaged_perceptron_tagger')

[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt.zip.
[nltk_data] Downloading package wordnet to /root/nltk_data...
[nltk_data] Downloading package averaged_perceptron_tagger to
[nltk_data]     /root/nltk_data...
[nltk_data]   Unzipping taggers/averaged_perceptron_tagger.zip.


True

**Step 4: Define the Stemming Function**

In [None]:
def stem_words(words):
    """Return a list with the Porter stem of each item in ``words``, in order.

    Args:
        words: Iterable of token strings.

    Returns:
        list[str]: One stem per input token.
    """
    # A new stemmer is built on every call, so no state is shared between calls.
    stem = PorterStemmer().stem
    return list(map(stem, words))


**Step 5: Define a Function to Map POS Tags for Lemmatization**

In [None]:
def get_wordnet_pos(word):
    """Return the WordNet part-of-speech constant to use when lemmatizing ``word``.

    The word is tagged on its own (as a one-token list) with ``nltk.pos_tag``,
    so the tag is chosen without any surrounding sentence context. The first
    letter of that tag, upper-cased, selects the WordNet category:
    J -> adjective, N -> noun, V -> verb, R -> adverb. Any other tag falls
    back to noun.

    Args:
        word: A single token string.

    Returns:
        One of ``wordnet.ADJ``, ``wordnet.NOUN``, ``wordnet.VERB`` or
        ``wordnet.ADV``.
    """
    # pos_tag returns [(token, tag)]; only the tag of the single entry matters.
    _, raw_tag = nltk.pos_tag([word])[0]
    initial = raw_tag[0].upper()

    if initial == "J":
        return wordnet.ADJ
    if initial == "V":
        return wordnet.VERB
    if initial == "R":
        return wordnet.ADV
    # "N" and every unmapped tag resolve to noun.
    return wordnet.NOUN

**Step 6: Define the Lemmatization Function**

In [None]:
def lemmatize_words(words):
    """Lemmatize every token in ``words`` using a POS tag chosen in context.

    The whole token sequence is passed to ``nltk.pos_tag`` in one call, so the
    tagger sees each token together with its neighbours instead of tagging
    every word in isolation, and the tagger is invoked once rather than once
    per token. The first letter of each tag selects the WordNet category
    (J -> adjective, N -> noun, V -> verb, R -> adverb); any other tag is
    lemmatized as a noun.

    Args:
        words: Iterable of token strings, in sentence order.

    Returns:
        list[str]: One lemma per input token, in the same order. An empty
        input yields an empty list.
    """
    lemmatizer = WordNetLemmatizer()
    tag_to_pos = {
        "J": wordnet.ADJ,
        "N": wordnet.NOUN,
        "V": wordnet.VERB,
        "R": wordnet.ADV,
    }

    # list() lets callers pass any iterable, as the original comprehension did.
    tagged = nltk.pos_tag(list(words))

    # tag[:1] (not tag[0]) so an unexpected empty tag falls through to the
    # noun default instead of raising IndexError.
    return [
        lemmatizer.lemmatize(word, tag_to_pos.get(tag[:1].upper(), wordnet.NOUN))
        for word, tag in tagged
    ]

**Step 7: Define a Function to Preprocess Text**

In [None]:
def preprocess_text(text):
    """Lower-case ``text`` and split it into tokens with ``word_tokenize``.

    Args:
        text: The raw input string.

    Returns:
        The token list produced by ``word_tokenize`` for the lower-cased text.
    """
    lowered = text.lower()
    tokens = word_tokenize(lowered)
    return tokens

**Step 8: Apply the Preprocessing, Stemming, and Lemmatization**

In [None]:
# Demo: run one sentence through tokenization, then stem and lemmatize the
# same token list so the two results can be compared side by side.
text = "She sells seashells by the seashore."
words = preprocess_text(text)

stemmed_words = stem_words(words)
lemmatized_words = lemmatize_words(words)

# Each row prints as "<label> <value>", one line per result.
for label, value in (
    ("Original Sentence:", text),
    ("Stemmed Sentence:", stemmed_words),
    ("Lemmatized Sentence:", lemmatized_words),
):
    print(label, value)


Original Sentence: She sells seashells by the seashore.
Stemmed Sentence: ['she', 'sell', 'seashel', 'by', 'the', 'seashor', '.']
Lemmatized Sentence: ['she', 'sell', 'seashell', 'by', 'the', 'seashore', '.']
