In [1]:
import nltk
import string
import re
from nltk.corpus import stopwords
from nltk.tokenize import word_tokenize
from nltk.stem import PorterStemmer, WordNetLemmatizer


In [2]:
# Sample corpus: four short English sentences about plants and gardening.
# Each sentence is passed through preprocess_text individually.
texts = [
    "Planting trees provides oxygen and improves air quality.",
    "Gardening promotes physical activity and mental well-being.",
    "Plants can reduce stress and enhance relaxation.",
    "Growing your own vegetables ensures fresh and healthy food."
]

In [3]:
# Fetch the NLTK data this notebook relies on: the Punkt tokenizer models
# (for word_tokenize), the stop-word lists, and WordNet (for the lemmatizer).
nltk.download('punkt')
# Recent NLTK releases load the Punkt tokenizer from the pickle-free
# 'punkt_tab' package instead of 'punkt'; without it word_tokenize raises
# LookupError on a fresh kernel. Fetching both keeps old and new versions working.
nltk.download('punkt_tab')
nltk.download('stopwords')
# Kept last so the cell still displays this call's return value.
nltk.download('wordnet')

[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Unzipping tokenizers/punkt.zip.
[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Unzipping corpora/stopwords.zip.
[nltk_data] Downloading package wordnet to /root/nltk_data...


True

In [4]:
# Shared NLP helpers, built once and reused by preprocess_text for every sentence.
lemmatizer = WordNetLemmatizer()
stemmer = PorterStemmer()
# English stop words, held as a set for fast membership tests while filtering.
stop_words = set(stopwords.words('english'))

In [5]:
def preprocess_text(text):
    """Clean a sentence and return its stemmed and lemmatized forms.

    The text is lowercased, stripped of every character in
    ``string.punctuation``, stripped of digits, and whitespace-normalised
    *before* it is tokenized, so numeric tokens can no longer leak into the
    stemmed and lemmatized output. English stop words are then dropped and
    the remaining tokens are stemmed and lemmatized independently of each
    other (lemmatization runs on the unstemmed tokens).

    Relies on the module-level ``stop_words``, ``stemmer`` and
    ``lemmatizer`` objects.

    Args:
        text: Raw input string.

    Returns:
        dict with three string values:
            "original":   the cleaned text (lowercased, punctuation and
                          digits removed, whitespace collapsed) -- not the
                          raw input, despite the key name.
            "stemmed":    space-joined stems of the non-stop-word tokens.
            "lemmatized": space-joined lemmas of the non-stop-word tokens.
    """
    text = text.lower()
    # Punctuation is deleted, not replaced by a space, so hyphenated words
    # are fused ("well-being" -> "wellbeing").
    text = text.translate(str.maketrans('', '', string.punctuation))
    # Strip digits and collapse whitespace before tokenizing; doing this
    # afterwards would only clean the "original" value and leave numbers in
    # the token lists.
    text = re.sub(r'\d+', '', text)
    text = ' '.join(text.split())

    words = word_tokenize(text)
    words = [word for word in words if word not in stop_words]

    stemmed_words = [stemmer.stem(word) for word in words]
    # lemmatize() is called without a part-of-speech argument, so the
    # lemmatizer's default applies; inflected verbs such as "provides" come
    # through unchanged.
    lemmatized_words = [lemmatizer.lemmatize(word) for word in words]

    return {
        "original": text,
        "stemmed": ' '.join(stemmed_words),
        "lemmatized": ' '.join(lemmatized_words)
    }



In [6]:
# Run every sample sentence through the preprocessing pipeline, keeping input order.
preprocessed_texts = list(map(preprocess_text, texts))

In [8]:
# Show each raw sentence alongside its stemmed and lemmatized forms.
for i, processed in enumerate(preprocessed_texts):
    report_lines = (
        f"Original: {texts[i]}",
        f"Stemmed: {processed['stemmed']}",
        f"Lemmatized: {processed['lemmatized']}",
        "\n",  # trailing spacer between sentences
    )
    print(*report_lines, sep="\n")

Original: Planting trees provides oxygen and improves air quality.
Stemmed: plant tree provid oxygen improv air qualiti
Lemmatized: planting tree provides oxygen improves air quality


Original: Gardening promotes physical activity and mental well-being.
Stemmed: garden promot physic activ mental wellb
Lemmatized: gardening promotes physical activity mental wellbeing


Original: Plants can reduce stress and enhance relaxation.
Stemmed: plant reduc stress enhanc relax
Lemmatized: plant reduce stress enhance relaxation


Original: Growing your own vegetables ensures fresh and healthy food.
Stemmed: grow veget ensur fresh healthi food
Lemmatized: growing vegetable ensures fresh healthy food


