In [1]:
import pandas as pd
from textblob import TextBlob

# Read the car dataset; a 'review' column is optional and is filled in below
# with placeholder text when the file does not provide one.
data = pd.read_csv("cars_2010_2020.csv")

if 'review' in data.columns:
    # Real reviews are present: blank out missing entries so every row holds text
    data['review'] = data['review'].fillna("")
else:
    # No reviews in the file: repeat a fixed set of sample sentences, cycling
    # through them in order until every row of the DataFrame has one.
    reviews = [
        "This car is amazing!",
        "Worst experience ever.",
        "It's an average vehicle.",
        "I love this car!",
        "The engine performance is terrible.",
    ]
    num_reviews = len(data)
    data['review'] = [reviews[i % len(reviews)] for i in range(num_reviews)]

# Function to get sentiment polarity
def get_sentiment(text):
    """Return the TextBlob sentiment polarity of *text*.

    Args:
        text: Review text. ``None`` and float NaN (the marker pandas uses for
            missing cells) are treated as empty text; any other non-string
            value is converted with ``str()`` before analysis.

    Returns:
        The polarity score reported by TextBlob as a float, or ``0.0`` when
        the text is missing, empty, or whitespace-only.
    """
    if text is None or (isinstance(text, float) and text != text):
        # Missing value (None / NaN): TextBlob would raise TypeError on these.
        return 0.0
    if not isinstance(text, str):
        # TextBlob only accepts strings; coerce numeric or other cell values.
        text = str(text)
    if not text.strip():
        # Nothing to analyse; blank text is scored as neutral.
        return 0.0
    return TextBlob(text).sentiment.polarity

# Score every review and store the polarity in a new 'sentiment' column
data['sentiment'] = data['review'].map(get_sentiment)

# Show the first few reviews next to their computed scores
preview = data[['review', 'sentiment']].head()
print(preview)

                                review  sentiment
0                 This car is amazing!      0.750
1               Worst experience ever.     -1.000
2             It's an average vehicle.     -0.150
3                     I love this car!      0.625
4  The engine performance is terrible.     -1.000
