In [None]:
# Colab-only cell: prompt the user to upload file(s) from their machine.
# NOTE(review): presumably this is how 'training_data.xlsx' (read by the
# training cell) gets into the runtime's working directory -- confirm.
from google.colab import files

# Keep the return value of the upload call; nothing visible in this
# notebook reads `uploaded` afterwards.
uploaded = files.upload()

In [None]:
import pandas as pd
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.pipeline import Pipeline
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score
from sklearn.naive_bayes import MultinomialNB

# Train and evaluate a TF-IDF + Multinomial Naive Bayes text classifier.
#
# Reads 'training_data.xlsx' from the working directory; the sheet must have
# an 'input' column (the text to classify) and an 'output' column (the label).

# Load the data from the Excel file
data = pd.read_excel('training_data.xlsx')

# Drop rows with a missing text or label: empty spreadsheet cells load as NaN,
# which TfidfVectorizer rejects as a document and the classifier rejects as a
# label. When nothing is missing this is a no-op and the split is unchanged.
data = data.dropna(subset=['input', 'output'])

# Split the data into training and testing sets (fixed seed => reproducible)
train_data, test_data = train_test_split(data, test_size=0.5, random_state=42)

# Define the pipeline for the machine learning model:
# raw text -> TF-IDF features -> Multinomial Naive Bayes (light smoothing)
pipeline = Pipeline([
    ('tfidf', TfidfVectorizer()),
    ('clf', MultinomialNB(alpha=0.01)),
])

# Fit the pipeline to the training data
pipeline.fit(train_data['input'], train_data['output'])

# Make predictions on the test data (one batched call for the whole test set)
test_predictions = pipeline.predict(test_data['input'])

# Calculate the accuracy of the model on the test data
test_accuracy = accuracy_score(test_data['output'], test_predictions)

# Print the accuracy of the model on the test data
print("Test accuracy: {:.2f}%".format(test_accuracy * 100))

# Print the input and output for each test case.
# The batched predictions above are in the same row order as test_data, so
# reuse them instead of re-running the whole pipeline once per row.
print("Test cases:")
for input_text, expected_output, predicted_output in zip(
    test_data['input'], test_data['output'], test_predictions
):
    print(f"Input: {input_text}")
    print(f"Expected output: {expected_output}")
    print(f"Predicted output: {predicted_output}\n")