In [None]:
import pandas as pd
from sklearn.feature_extraction.text import CountVectorizer
from sklearn.model_selection import train_test_split
from sklearn.naive_bayes import MultinomialNB
from sklearn.metrics import accuracy_score

# Load both tab-separated sources. Neither file has a header row, so the two
# columns are named explicitly: the text and its sentiment label.
comments = pd.read_csv("data/comments.txt", sep='\t', header=None, names=['Comment', 'Sentiment'])
reviews = pd.read_csv("data/reviews.txt", sep='\t', header=None, names=['Comment', 'Sentiment'])
# ignore_index=True gives the combined frame a unique 0..n-1 index; without it
# each file keeps its own 0-based labels and the index contains duplicates.
dataset = pd.concat([comments, reviews], axis=0, ignore_index=True)

# Coerce every comment to a unicode string for the vectorizer. Missing
# comments are turned into empty documents first; a bare astype('U') would
# convert NaN into the literal word "nan", which would then become a feature.
texts = dataset['Comment'].fillna('').values.astype('U')
y = dataset['Sentiment']

# Split the raw text *before* vectorizing so that the vocabulary is learned
# from the training portion only. Fitting the vectorizer on the full corpus
# lets information from the test documents leak into the features.
# test_size and random_state are unchanged from the previous version.
texts_train, texts_test, y_train, y_test = train_test_split(
    texts, y, test_size=0.3, random_state=42
)

# Bag-of-Words model: fit on the training texts, then reuse the fitted
# vocabulary to encode the held-out texts (unseen words are ignored).
vectorizer = CountVectorizer(stop_words='english')
X_train = vectorizer.fit_transform(texts_train)
X_test = vectorizer.transform(texts_test)
# Full-corpus matrix encoded with the training vocabulary; kept so that any
# later code referring to X continues to work.
X = vectorizer.transform(texts)

# Train a Multinomial Naive Bayes classifier on the word counts.
clf = MultinomialNB()
clf.fit(X_train, y_train)

# Evaluate on the held-out split and report plain accuracy.
y_pred = clf.predict(X_test)
accuracy = accuracy_score(y_test, y_pred)
print(f"Accuracy: {accuracy}")