### Installing Libraries

In [None]:
# Install third-party packages into the notebook environment (shell commands via `!`).
# NOTE(review): scipy, pillow and h5py are not imported directly by the cells
# visible here — presumably indirect requirements; confirm before trimming.
!pip install numpy scipy
!pip install scikit-learn
!pip install pillow
!pip install h5py

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


In [None]:
# Install TensorFlow, which provides the tensorflow.keras API imported further down.
!pip install tensorflow

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting tensorboard<2.10,>=2.9
  Using cached tensorboard-2.9.1-py3-none-any.whl (5.8 MB)
Collecting flatbuffers<2,>=1.12
  Using cached flatbuffers-1.12-py2.py3-none-any.whl (15 kB)
Collecting tensorflow-estimator<2.10.0,>=2.9.0rc0
  Using cached tensorflow_estimator-2.9.0-py2.py3-none-any.whl (438 kB)
Collecting keras<2.10.0,>=2.9.0rc0
  Using cached keras-2.9.0-py2.py3-none-any.whl (1.6 MB)
Installing collected packages: tensorflow-estimator, tensorboard, keras, flatbuffers
  Attempting uninstall: tensorflow-estimator
    Found existing installation: tensorflow-estimator 2.10.0
    Uninstalling tensorflow-estimator-2.10.0:
      Successfully uninstalled tensorflow-estimator-2.10.0
  Attempting uninstall: tensorboard
    Found existing installation: tensorboard 2.10.1
    Uninstalling tensorboard-2.10.1:
      Successfully uninstalled tensorboard-2.10.1
  Attempting uninstall: keras


In [None]:
# NOTE(review): the model cells import from tensorflow.keras, not from the
# standalone `keras` package, so this install may be redundant — confirm.
!pip install keras

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


In [None]:
# NOTE(review): the recorded pip logs show this install and the plain
# `tensorflow` install above replacing each other's tensorflow-estimator and
# tensorboard versions (2.9.x <-> 2.10.x). Presumably only one of the two
# packages is needed — confirm and drop the other.
!pip install tensorflow-gpu

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting tensorboard<2.11,>=2.10
  Using cached tensorboard-2.10.1-py3-none-any.whl (5.9 MB)
Collecting tensorflow-estimator<2.11,>=2.10.0
  Using cached tensorflow_estimator-2.10.0-py2.py3-none-any.whl (438 kB)
Collecting flatbuffers>=2.0
  Using cached flatbuffers-22.9.24-py2.py3-none-any.whl (26 kB)
Collecting keras<2.11,>=2.10.0
  Using cached keras-2.10.0-py2.py3-none-any.whl (1.7 MB)
Installing collected packages: tensorflow-estimator, tensorboard, keras, flatbuffers
  Attempting uninstall: tensorflow-estimator
    Found existing installation: tensorflow-estimator 2.9.0
    Uninstalling tensorflow-estimator-2.9.0:
      Successfully uninstalled tensorflow-estimator-2.9.0
  Attempting uninstall: tensorboard
    Found existing installation: tensorboard 2.9.1
    Uninstalling tensorboard-2.9.1:
      Successfully uninstalled tensorboard-2.9.1
  Attempting uninstall: keras
    Found e

In [None]:
# ann_visualizer is imported later to draw the network diagram; graphviz is
# presumably its rendering backend (TODO confirm).
!pip install ann_visualizer graphviz

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/


In [None]:
from tensorflow.keras.models import Sequential
from tensorflow.keras.losses import categorical_crossentropy
from tensorflow.keras.optimizers import SGD
from tensorflow.keras.layers import Dense
 
from numpy import argmax
import numpy as np
import re

### Input Training Data

In [None]:
# Training inputs: one symptom/condition phrase per entry.
# Entry i belongs with Y[i]; the encoded forms of X and Y are later split and
# fed to the model together, row for row.
X = [ "Vitamin D", 
      "Weakness", 
      "Tooth Pain", 
      "Vomitings", 
      "Body pains", 
      "Throat Pain",
      "Stomach Pain",
      "Skin Infection",
      "Minor Burns",
      "Diabetes",
      "Blood Pressure",
      "Thyroid",
      "Minor-Cuts",
      "Cold",
      "Cough",
      "Ear Pain",
      "Septic",
      "Prevention of Heart Attack",
      "KidneyStone",
      "Gastric"]

In [None]:
# Training labels: one label string per entry of X, matched by position
# (presumably the medicine suggested for that symptom — TODO confirm with the
# data owner). Every label in this list is distinct.
Y = ['D-rise60k',
     'Supradyn',
     'Paracetamol',
     'Domperidone',
     'Coquitmbiflam',
     'Eryctro',
     'Cyclopam',
     'Fluconazole',
     'Burnol(Oientiment)',
     'Metformin',
     'Losartin',
     'Thyronorm',
     'Betnovate-N(Oientiment)',
     'Citrogen',
     'Kuff-Q',
     'Candibiotic(Drops)',
     'Tetanus Vaccine',
     'Sorditrate',
     'Sustain',
     'Pantoprazole']

In [None]:
# Sanity check: the inputs and labels are paired by index, so both counts
# should be equal.
print(len(X))
print(len(Y))

20
20


### Text Processing

## Removing Non-Alphanumeric Characters

In [None]:
def remove_non_alpha_numeric_characters(sentence):
    """Return `sentence` with everything except letters, digits and spaces removed.

    Args:
        sentence: The text to clean.

    Returns:
        A new string made of the characters of `sentence` for which
        ``str.isalnum()`` is true, plus literal space characters, in their
        original order. Removed characters are dropped rather than replaced,
        so "Minor-Cuts" becomes "MinorCuts".
    """
    # isalnum() (not isalpha()) so digits survive, as the function name promises.
    # join() builds the result in one pass instead of repeated concatenation.
    return ''.join(
        token for token in sentence if token.isalnum() or token == ' '
    )

In [None]:
def preprocess_data(X):
    """Normalise a collection of phrases for vocabulary building and encoding.

    Each phrase is lower-cased, filtered through
    `remove_non_alpha_numeric_characters`, stripped of leading/trailing
    whitespace, and has runs of spaces collapsed to a single space.

    Args:
        X: Iterable of strings.

    Returns:
        A new list with one cleaned string per input phrase, in the same order.
    """
    cleaned = []
    for data_point in X:
        text = remove_non_alpha_numeric_characters(data_point.lower())
        text = text.strip()
        cleaned.append(re.sub(' +', ' ', text))
    return cleaned

In [None]:
# Normalise the raw phrases once; the cells below work on the cleaned text.
X = preprocess_data(X)

# Collect every distinct word that occurs in the cleaned phrases.
# The set is sorted before use because the iteration order of a set of strings
# can differ from one interpreter run to the next, and a word's position in
# `vocabulary` is the feature index used when sentences are encoded.
vocabulary = sorted(
    {word for data_point in X for word in data_point.split(' ')}
)
print(vocabulary)
print(len(vocabulary))

['gastric', 'tooth', 'weakness', 'd', 'thyroid', 'attack', 'vitamin', 'stomach', 'vomitings', 'infection', 'throat', 'heart', 'skin', 'burns', 'pains', 'cold', 'blood', 'septic', 'ear', 'cough', 'diabetes', 'prevention', 'pain', 'of', 'body', 'minor', 'minorcuts', 'kidneystone', 'pressure']
29


### Splitting a Sentence

In [None]:
"hey hello hi there".split(' ')

['hey', 'hello', 'hi', 'there']

## Create document vectors

In [None]:
def encode_sentence(sentence):
    """Encode a sentence as a binary bag-of-words vector over `vocabulary`.

    The sentence is first normalised with `preprocess_data`, so raw user
    input and already-cleaned training phrases are treated alike.

    Args:
        sentence: The text to encode.

    Returns:
        A list of ints with one entry per word in `vocabulary`: entry i is 1
        when vocabulary[i] appears as a whole word in the cleaned sentence and
        0 otherwise. Words that are not in `vocabulary` are ignored.
    """
    sentence = preprocess_data([sentence])[0]
    # Split once, outside the loop; a set gives constant-time membership tests.
    words = set(sentence.split(' '))
    return [1 if word in words else 0 for word in vocabulary]


# Encode every training phrase; row i corresponds to X[i].
X_encoded = [encode_sentence(sentence) for sentence in X]
print(X_encoded)

[[0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], [0, 0, 0, 0, 1, 0, 0

In [None]:
# Distinct labels, sorted so that each label keeps the same class index on
# every run (iterating a bare set of strings can reorder between runs, which
# would change what each output unit of the model stands for).
classes = sorted(set(Y))
print(classes)

# One-hot encode the labels: row i has a single 1 at the class index of Y[i].
class_index = {label: position for position, label in enumerate(classes)}
Y_encoded = [
    [1 if position == class_index[label] else 0
     for position in range(len(classes))]
    for label in Y
]

print(Y_encoded)

['Thyronorm', 'Coquitmbiflam', 'Sorditrate', 'Eryctro', 'Metformin', 'Pantoprazole', 'Tetanus Vaccine', 'Citrogen', 'Cyclopam', 'Losartin', 'Betnovate-N(Oientiment)', 'Sustain', 'Kuff-Q', 'Domperidone', 'Paracetamol', 'Supradyn', 'Candibiotic(Drops)', 'Burnol(Oientiment)', 'D-rise60k', 'Fluconazole']
[[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0], [0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1], [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0], [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [1, 0, 0, 0, 0,

# Create training data and test data

In [None]:
# Baseline assignment: use the complete encoded data set for both training and
# testing. NOTE: the train_test_split cell that follows rebinds all four names.
X_train, y_train = X_encoded, Y_encoded
X_test, y_test = X_encoded, Y_encoded

In [None]:
from sklearn.model_selection import train_test_split

# Shuffle with a fixed seed and keep 80% of the rows for training, 20% for testing.
# NOTE(review): every label in Y occurs exactly once (20 samples, 20 classes),
# so the labels that land in the test split are never seen during training.
# The recorded evaluation output ("Correct: 0" of 4) is consistent with that —
# consider whether a hold-out split is meaningful for this data set.
X_train, X_test, y_train, y_test = train_test_split(
    X_encoded,
    Y_encoded,
    train_size=0.8,
    random_state=123,
    shuffle=True,
)

In [None]:
# Inspect the one-hot labels of the held-out samples.
print (y_test)

[[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0], [0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0], [0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0]]


In [None]:
# Number of samples left for training after the split.
print(len(X_train))

16


In [None]:
# Display the one-hot training labels (bare expression, shown as the cell output).
y_train

[[0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1],
 [0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0],
 [0, 0, 0, 0, 0, 0, 0, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,

# Model training

In [None]:
# Single-hidden-layer classifier: bag-of-words vector -> 64 sigmoid units ->
# softmax with one output unit per label class.
model = Sequential()
model.add(Dense(units=64, activation='sigmoid',
                input_dim=len(X_train[0])))
model.add(Dense(units=len(y_train[0]), activation='softmax'))
model.compile(loss=categorical_crossentropy,
              # `learning_rate` is the supported argument name; the old `lr`
              # alias is deprecated and rejected by newer Keras releases.
              optimizer=SGD(learning_rate=0.01,
                            momentum=0.9, nesterov=True))

# batch_size=1: the weights are updated after every individual sample.
model.fit(np.array(X_train), np.array(y_train), epochs=100, batch_size=1)

Epoch 1/100


  super().__init__(name, **kwargs)


Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100
Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Epoch 77/100
Epoch 78/100
Epoch 7

<keras.callbacks.History at 0x7f07a19d7e10>

In [None]:
# model.summary() prints the layer table itself and returns None, so it must
# not be passed to print() — doing so appended a stray "None" to the message.
print("The model summary is this.It shows the model structure")
model.summary()

Model: "sequential"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense (Dense)               (None, 64)                1920      
                                                                 
 dense_1 (Dense)             (None, 20)                1300      
                                                                 
Total params: 3,220
Trainable params: 3,220
Non-trainable params: 0
_________________________________________________________________
The model summary is this.It shows the model structure None


In [None]:
# Draw a diagram of the trained network with ann_visualizer.
# NOTE(review): this import sits mid-notebook rather than in the import cell,
# and the title string below contains the typo "Nueral" — left unchanged here.
from ann_visualizer.visualize import ann_viz
ann_viz(model, title="Nueral Network for Healthbot looks")

## List predictions

In [None]:
# Run the model once over the held-out inputs. Each row of the result is the
# softmax output for one sample: one probability per entry of `classes`.
predicted_value = model.predict(np.array(X_test))
# Reuse the probabilities computed above instead of calling predict() a second
# time on the same input; argmax picks the most probable class index per row.
predictions = [argmax(pred) for pred in predicted_value]
print("The predicted value is", predicted_value)
print("The predicted value using argmax is", predictions)
print("The actual value is", y_test)

The predicted value is [[6.5070309e-02 4.3575457e-04 4.0945449e-04 4.0358712e-04 1.2328901e-01
  9.9191152e-02 7.4868038e-02 7.3479109e-02 1.4218960e-02 3.4240350e-02
  7.7242412e-02 9.6497320e-02 3.6675445e-04 8.5024543e-02 1.5362038e-02
  1.0389740e-01 2.1170113e-02 4.1615538e-02 3.7509117e-02 3.5708956e-02]
 [9.0173520e-03 1.9336716e-04 2.3949450e-04 1.8281673e-04 1.2116299e-02
  2.7421480e-02 2.2901729e-02 1.8859515e-02 2.2890691e-01 7.3798173e-03
  3.4305956e-02 2.2511993e-02 1.9312518e-04 1.7429413e-02 2.6373231e-01
  2.3443932e-02 2.8108248e-01 1.0899930e-02 8.4076999e-03 1.0774379e-02]
 [7.4112900e-02 4.4769063e-04 4.3037484e-04 4.3114778e-04 6.9332071e-02
  6.4127274e-02 1.1467110e-01 8.4457919e-02 1.9725915e-02 2.5129534e-02
  8.0040947e-02 1.3868453e-01 4.2482530e-04 8.1215426e-02 2.0997571e-02
  9.0478644e-02 2.7229078e-02 3.5179134e-02 3.4856308e-02 3.8027577e-02]
 [8.4636576e-02 3.8133588e-04 3.5818067e-04 3.1339694e-04 6.1319750e-02
  8.0707349e-02 9.7597249e-02 1.167818

# Model Evaluation

In [None]:
# Count the test samples whose predicted class index equals the position of
# the 1 in the corresponding one-hot label.
correct = sum(
    1
    for idx in range(len(predictions))
    if predictions[idx] == argmax(y_test[idx])
)

print ("Correct:", correct)
print ("Total:", len(predictions))

Correct: 0
Total: 4


# Testing the chatbot

In [None]:

# Interactive loop: show the known symptom phrases, read one line from the
# user, and print the label the model predicts for it. Type 'quit' to stop.
while True:
    print (X)
    try:
        sentence = input()
    except (EOFError, KeyboardInterrupt):
        # Interrupting the kernel or closing stdin ends the chat cleanly
        # instead of leaving the cell in an error state.
        break
    if sentence.strip().lower() == 'quit':
        break

    encoded = encode_sentence(sentence)
    if not any(encoded):
        # No word of the input is in the vocabulary, so the network would be
        # fed an all-zero vector and still name some label. Say so instead.
        print ("Sorry, I do not recognise that symptom. Please use one of the phrases listed above.")
        continue

    prediction = model.predict(np.array([encoded]))
    print (classes[argmax(prediction)])


['vitamin d', 'weakness', 'tooth pain', 'vomitings', 'body pains', 'throat pain', 'stomach pain', 'skin infection', 'minor burns', 'diabetes', 'blood pressure', 'thyroid', 'minorcuts', 'cold', 'cough', 'ear pain', 'septic', 'prevention of heart attack', 'kidneystone', 'gastric']
['D-rise60k', 'Supradyn', 'Paracetamol', 'Domperidone', 'Coquitmbiflam', 'Eryctro', 'Cyclopam', 'Fluconazole', 'Burnol(Oientiment)', 'Metformin', 'Losartin', 'Thyronorm', 'Betnovate-N(Oientiment)', 'Citrogen', 'Kuff-Q', 'Candibiotic(Drops)', 'Tetanus Vaccine', 'Sorditrate', 'Sustain', 'Pantoprazole']
vitamin d
D-rise60k
['vitamin d', 'weakness', 'tooth pain', 'vomitings', 'body pains', 'throat pain', 'stomach pain', 'skin infection', 'minor burns', 'diabetes', 'blood pressure', 'thyroid', 'minorcuts', 'cold', 'cough', 'ear pain', 'septic', 'prevention of heart attack', 'kidneystone', 'gastric']
['D-rise60k', 'Supradyn', 'Paracetamol', 'Domperidone', 'Coquitmbiflam', 'Eryctro', 'Cyclopam', 'Fluconazole', 'Burnol

KeyboardInterrupt: ignored