Load training and testing data from CSV files.

In [None]:
import pandas as pd

# Read the training and test tables from CSV files in the working directory.
train_data = pd.read_csv(filepath_or_buffer='train.csv')
test_data = pd.read_csv(filepath_or_buffer='test.csv')

Preprocess the text data by converting it into numerical features using TF-IDF.

In [None]:
from sklearn.feature_extraction.text import TfidfVectorizer

# Raw text columns that will be turned into TF-IDF feature matrices.
train_text = train_data['text']
test_text = test_data['text']

# Fit the vectorizer on the training text only, then apply the same fitted
# vectorizer to the test text.
vectorizer = TfidfVectorizer()
X_train = vectorizer.fit_transform(train_text)
X_test = vectorizer.transform(test_text)

Initialize the TPOT classifier for automated machine learning.

In [None]:
from tpot import TPOTClassifier

# TfidfVectorizer yields a SciPy sparse matrix, and TPOT's default operator
# set rejects sparse input with a ValueError at fit time. The built-in
# 'TPOT sparse' configuration restricts the search to operators that accept
# sparse features.
# NOTE(review): generations / population_size are left at the library
# defaults, which can make the search run for a very long time -- consider
# setting them (or max_time_mins) explicitly.
tpot = TPOTClassifier(verbosity=2, config_dict='TPOT sparse')


Train the model using the training data.

In [None]:
# Run TPOT's pipeline search on the TF-IDF features against the 'label' column.
y_train = train_data['label']
tpot.fit(X_train, y_train)

Export the best pipeline found by TPOT as Python source code.

In [None]:
# Per the TPOT docs, export() writes the Python source code of the best
# pipeline found to 'best_model.py'; it does not serialize the fitted model.
tpot.export('best_model.py')

Make predictions on the test data.

In [None]:
# Predict a label for every row of the TF-IDF test matrix using the fitted
# TPOT estimator.
predictions = tpot.predict(X_test)

Create a submission file from the predictions.

In [None]:
# Pair each test-row id with its predicted label, then write the two columns
# to 'submission.csv' without the DataFrame index.
submission = test_data[['id']].assign(prediction=predictions)
submission.to_csv('submission.csv', index=False)

Visualize the predictions using a histogram.

In [None]:
import matplotlib.pyplot as plt

# Draw the distribution of predicted values on an explicit Axes object.
fig, ax = plt.subplots()
ax.hist(predictions)
ax.set_title('Histogram of Predictions')
plt.show()