# In [None]:

import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.feature_extraction.text import TfidfVectorizer
from sklearn.linear_model import LogisticRegression
from sklearn.metrics import accuracy_score, classification_report
# Toy training set: each ingredient's molecular formula is labelled with the
# disposal method the classifier should learn to predict.
data = {
    'Ingredient Name': ['Acetaminophen', 'Ibuprofen', 'Aspirin', 'Pseudoephedrine',
                       'Diphenhydramine', 'Loratadine', 'Cetirizine', 'Famotidine',
                       'Omeprazole', 'Simvastatin', 'Atorvastatin', 'Metformin',
                       'Glipizide', 'Lisinopril', 'Hydrochlorothiazide', 'Amlodipine',
                       'Warfarin', 'Levothyroxine', 'Albuterol', 'Salbutamol'],
    'Chemical Composition': ['C8H9NO2', 'C13H18O2', 'C9H8O4', 'C10H15NO',
                             'C17H21NO', 'C22H23ClN2O2', 'C21H25ClN2O3', 'C13H14N4O3S',
                             'C17H19N3O3S', 'C25H38O5', 'C33H35FN2O6', 'C4H11N5O',
                             'C17H21N3O4S', 'C21H31N3O5', 'C7H8ClN3O4S', 'C20H25ClN2O5',
                             'C19H16O4', 'C15H11I4NO4', 'C13H21NO3', 'C13H21NO3'],
    'Disposal Method': ['Household Trash', 'Household Trash', 'Household Trash', 'Avoid Flushing',
                        'Avoid Flushing', 'Household Trash', 'Household Trash', 'Avoid Flushing',
                        'Avoid Flushing', 'Avoid Flushing', 'Avoid Flushing', 'Avoid Flushing',
                        'Avoid Flushing', 'Avoid Flushing', 'Avoid Flushing', 'Avoid Flushing',
                        'Avoid Flushing', 'Avoid Flushing', 'Avoid Flushing', 'Avoid Flushing']
}

df = pd.DataFrame(data)

# Preprocess the data: the formula string is the only feature, the disposal
# method is the target label.
X = df['Chemical Composition']
y = df['Disposal Method']

# Split the data into training and testing sets.
# The labels are imbalanced (5 'Household Trash' vs 15 'Avoid Flushing') and the
# test set holds only 4 rows, so stratify to keep both classes represented on
# each side of the split.
X_train, X_test, y_train, y_test = train_test_split(
    X, y, test_size=0.2, random_state=42, stratify=y
)

# Feature extraction using TF-IDF over character n-grams.
# The default word analyzer lowercases the text and treats a whole formula such
# as 'C8H9NO2' as a single token, so any formula that was not in the training
# set would be encoded as an all-zero vector. Character n-grams let different
# formulas share features, and lowercase=False keeps element symbols
# case-sensitive.
vectorizer = TfidfVectorizer(analyzer='char', ngram_range=(1, 3), lowercase=False)
X_train_vec = vectorizer.fit_transform(X_train)
X_test_vec = vectorizer.transform(X_test)

# Train a logistic regression model
model = LogisticRegression()
model.fit(X_train_vec, y_train)

# Make predictions on the test set and report how well they match.
# NOTE: with only 4 held-out rows this number is a smoke check, not a reliable
# estimate of model quality.
y_pred = model.predict(X_test_vec)
print(f"Test accuracy: {accuracy_score(y_test, y_pred):.2f}")

# Example prediction for a new ingredient.
# The model is trained on formulas, so an ingredient name typed by the user
# carries no useful signal. Names already present in the table are therefore
# resolved (case-insensitively) to their formula; anything else is treated as a
# formula and passed through unchanged.
name_to_composition = dict(
    zip(df['Ingredient Name'].str.lower(), df['Chemical Composition'])
)
user_entry = input(
    "Enter a chemical composition (e.g. C8H9NO2) or a known ingredient name: "
).strip()
new_ingredient_composition = name_to_composition.get(user_entry.lower(), user_entry)
new_ingredient_vec = vectorizer.transform([new_ingredient_composition])
predicted_disposal = model.predict(new_ingredient_vec)[0]
print(f"Predicted disposal method for {new_ingredient_composition}: {predicted_disposal}")


# Output recorded from an earlier notebook run:
#   Loratadine
#   Predicted disposal method for Loratadine: Avoid Flushing
