In [None]:
import pandas as pd
from sklearn.model_selection import train_test_split
from sklearn.preprocessing import LabelEncoder

In [None]:
# Read the labelled examples from CSV; later cells use its 'text' and 'category' columns.
DATA_PATH = "chatbot_dataset.csv"
df = pd.read_csv(DATA_PATH)

In [None]:
# Map every category name to an integer class id. The fitted encoder is kept
# because its `classes_` attribute is needed later to size the model output
# and to name the rows of the evaluation report.
label_encoder = LabelEncoder().fit(df['category'])
df['label'] = label_encoder.transform(df['category'])

In [None]:
# Hold out 20% of the rows for evaluation; the fixed seed makes the split repeatable.
split_options = {"test_size": 0.2, "random_state": 42}
X_train, X_test, y_train, y_test = train_test_split(df['text'], df['label'], **split_options)

In [None]:
from sentence_transformers import SentenceTransformer
import numpy as np

In [None]:
# Sentence-embedding model used by embed_texts() to turn raw text into vectors.
EMBED_MODEL_NAME = 'all-MiniLM-L6-v2'
embed_model = SentenceTransformer(EMBED_MODEL_NAME)

In [None]:
def embed_texts(texts):
    """Encode ``texts`` with the notebook-level ``embed_model`` and return a NumPy array.

    Args:
        texts: Passed unchanged to ``embed_model.encode`` (the callers in this
            notebook pass a plain Python list produced by ``Series.tolist()``).

    Returns:
        numpy.ndarray: ``np.array`` built from whatever the encoder returned.
    """
    embeddings = embed_model.encode(texts)
    return np.array(embeddings)

In [None]:
# Embed the training split first, then the test split; each Series is turned
# into a plain Python list before being handed to the encoder.
X_train_vectors, X_test_vectors = (
    embed_texts(split.tolist()) for split in (X_train, X_test)
)

In [None]:
import torch
import torch.nn as nn
import torch.optim as optim

class ChatbotModel(nn.Module):
    """Two-layer feed-forward classifier over fixed-size input vectors.

    Architecture: ``Linear(input_dim, hidden_dim) -> ReLU -> Linear(hidden_dim, output_dim)``.
    The forward pass returns raw class scores (logits); no softmax is applied.

    Args:
        input_dim: Size of each input feature vector.
        output_dim: Number of scores produced per sample (one per class).
        hidden_dim: Width of the hidden layer. Defaults to 256, the value that
            used to be hard-coded, so existing two-argument calls build the
            exact same architecture.
    """

    def __init__(self, input_dim, output_dim, hidden_dim=256):
        super().__init__()
        # The attribute names fc1/fc2 become the state_dict key prefixes;
        # keep them stable so previously saved weights still load.
        self.fc1 = nn.Linear(input_dim, hidden_dim)
        self.fc2 = nn.Linear(hidden_dim, output_dim)

    def forward(self, x):
        """Return logits for ``x``; the last dimension of ``x`` must equal ``input_dim``."""
        x = torch.relu(self.fc1(x))
        return self.fc2(x)

In [None]:
# Define model
# The input width is read from the computed embeddings instead of being
# hard-coded (it was 384), so changing the embedding model does not break
# the first layer. One output score is produced per encoded category.
model = ChatbotModel(
    input_dim=X_train_vectors.shape[1],
    output_dim=len(label_encoder.classes_),
)


In [None]:
# Training objective and optimiser: cross-entropy on the model's raw scores,
# Adam over every parameter of the model.
LEARNING_RATE = 1e-3
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=LEARNING_RATE)

In [None]:
# Training inputs as a float32 tensor.
X_train_torch = torch.tensor(X_train_vectors, dtype=torch.float32)
# y_train is a pandas Series whose index was shuffled by train_test_split.
# torch.tensor() treats a Series as a generic sequence and probes it with a
# label lookup (series[0]), which fails with "could not determine the shape of
# object type 'Series'" when label 0 is not in the training split. Converting
# to a NumPy array first makes the conversion purely positional.
y_train_torch = torch.tensor(y_train.to_numpy(), dtype=torch.long)

In [None]:
# Full-batch training: every epoch runs one forward/backward pass over the
# whole training tensor and takes exactly one optimizer step.
num_epochs = 10
for epoch in range(num_epochs):
    # Clear gradients left over from the previous step before accumulating new ones.
    optimizer.zero_grad()
    # Forward pass over all training samples at once.
    outputs = model(X_train_torch)
    loss = criterion(outputs, y_train_torch)
    # Back-propagate, then update the parameters.
    loss.backward()
    optimizer.step()
    # Report the loss measured before this epoch's parameter update (1-based epoch number).
    print(f'Epoch {epoch+1}/{num_epochs}, Loss: {loss.item()}')

In [None]:
from sklearn.metrics import classification_report

# Test inputs as a float32 tensor.
X_test_torch = torch.tensor(X_test_vectors, dtype=torch.float32)

# Inference only: switch the model to evaluation mode and disable autograd so
# no computation graph is built for the forward pass.
model.eval()
with torch.no_grad():
    # Predicted class id = index of the largest score along the class dimension.
    y_test_pred = torch.argmax(model(X_test_torch), dim=1).numpy()


In [None]:
# Pass the full list of encoded class ids explicitly. Without `labels`,
# classification_report infers the classes from y_test / y_test_pred and raises
# a ValueError when a category is missing from both, because the inferred
# classes no longer line up with `target_names`.
# LabelEncoder assigns ids 0..n_classes-1 in the order of `classes_`.
all_class_ids = list(range(len(label_encoder.classes_)))
print(classification_report(
    y_test,
    y_test_pred,
    labels=all_class_ids,
    target_names=label_encoder.classes_,
))

In [None]:
# Persist only the learned parameters (the state_dict), not the model object itself.
MODEL_PATH = "chatbot_model.pth"
torch.save(model.state_dict(), MODEL_PATH)