Import Required Libraries

In [None]:
import pandas as pd
import nltk, re
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.metrics.pairwise import cosine_similarity

 Download NLTK Stopwords

In [None]:
# Fetch the NLTK stop-word corpus; nltk reports "already up-to-date" when a
# current copy is cached locally.
nltk.download("stopwords")
from nltk.corpus import stopwords

# Hold the English stop words in a set so the token filter in the
# preprocessing step can use fast membership tests.
stop_words = {word for word in stopwords.words('english')}

[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Package stopwords is already up-to-date!


Load Dataset (upload `Reviews.csv` to the Colab session first)

In [None]:
# Read the raw CSV with the Python parsing engine; rows that cannot be
# parsed are skipped instead of aborting the load.
df = pd.read_csv(
    "Reviews.csv",
    engine="python",
    on_bad_lines="skip",
)

# Work with the first 10,000 non-null review texts only.
reviews = df.loc[:, 'Text'].dropna().iloc[:10000]

Preprocessing Function

In [None]:
def preprocess(text, stop_set=None):
    """Normalize raw text into a space-joined string of lowercase content words.

    Steps: lowercase the text, replace HTML tags (e.g. ``<br />``) and every
    non-letter character with a space, split on whitespace, and drop stop
    words.

    Markup and punctuation are replaced with a space rather than deleted so
    that neighbouring words stay separate: ``"reasonable.<br />I"`` yields
    ``reasonable`` instead of the fused token ``reasonablebr``, and
    ``"fast-shipping"`` yields ``fast shipping`` instead of ``fastshipping``.
    Contractions such as ``"I'm"`` split into fragments (``i``, ``m``) that
    are removed whenever the stop-word collection contains them.

    Args:
        text: Raw review or query string.
        stop_set: Optional collection of lowercase words to discard. When
            omitted, the notebook-level ``stop_words`` set is used.

    Returns:
        The remaining tokens joined by single spaces (``""`` if none remain).
    """
    if stop_set is None:
        # Resolved at call time so the notebook-level set is the default.
        stop_set = stop_words
    text = text.lower()
    # A tag must start with a letter right after '<' (or '</'), so plain
    # comparisons like "a < 5" are not mistaken for markup.
    text = re.sub(r'</?[a-z][^>]*>', ' ', text)
    # Replace (not delete) punctuation, digits and other symbols.
    text = re.sub(r'[^a-z\s]', ' ', text)
    tokens = [w for w in text.split() if w not in stop_set]
    return " ".join(tokens)

 Apply preprocessing and build the TF-IDF matrix

In [None]:
# Clean every review text with the shared preprocessing function.
cleaned = reviews.map(preprocess)

# Learn the TF-IDF vocabulary/weights from the cleaned reviews and encode
# them in one pass; X has one row per review.
vectorizer = TfidfVectorizer()
X = vectorizer.fit_transform(cleaned)

Search function: print the top-k reviews most similar to a query

In [None]:
def search_reviews(query, k=5):
    """Print the reviews most similar to ``query`` under TF-IDF cosine similarity.

    The query is cleaned with ``preprocess``, encoded with the fitted
    notebook-level ``vectorizer`` and compared against every row of ``X``.
    Up to ``k`` reviews are printed in descending similarity, each with its
    original and cleaned text.

    Reviews with zero similarity share no vocabulary term with the query and
    are never printed; if nothing matches, a short notice is printed instead.

    Args:
        query: Free-text search string.
        k: Maximum number of reviews to print. Values <= 0 print nothing.

    Returns:
        None. Results are written to stdout.
    """
    # Guard: with k == 0 the slice [-0:] below would select *every* review.
    if k <= 0:
        return
    q = preprocess(query)
    q_vec = vectorizer.transform([q])
    sims = cosine_similarity(q_vec, X).flatten()
    # argsort is ascending: take the last k entries, then reverse for best-first.
    idx = sims.argsort()[-k:][::-1]
    # Drop zero-similarity rows so arbitrary reviews are not shown as matches.
    hits = [i for i in idx if sims[i] > 0]
    if not hits:
        print("\nNo matching reviews found.")
        return
    for i in hits:
        print(f"\nOriginal: {reviews.iloc[i]}\nCleaned: {cleaned.iloc[i]}")

 Query Examples

In [None]:
# Run each example query through the search function, labelling the output.
example_queries = ["great product with fast shipping", "disappointed"]
for number, query in enumerate(example_queries, start=1):
    # Every label after the first is preceded by a blank line.
    separator = "" if number == 1 else "\n"
    print(f"{separator}Query {number}: {query}")
    search_reviews(query)

Query 1: great product with fast shipping

Original: Enjoyed the product and they also provided very fast shipping.  I'm about out and need to order more.
Cleaned: enjoyed product also provided fast shipping im need order

Original: The tea is good and fresh. We enjoy it. The shipping is fast and cost is reasonable.<br />I recommend this product.
Cleaned: tea good fresh enjoy shipping fast cost reasonablebr recommend product

Original: My daughter lives in Hawaii and sent me some great coffee from there. I have a Keurig and  was not sure how to use the new coffee. I got these fast fast and now am using my Hawaiian coffee. Great product.
Cleaned: daughter lives hawaii sent great coffee keurig sure use new coffee got fast fast using hawaiian coffee great product

Original: The energy drink is a great product. The shipping price is crazy tho. I paid more for the shipping then both products together, so not a great deal.
Cleaned: energy drink great product shipping price crazy tho paid shi