In [1]:
import json
import pandas as pd
import numpy as np
import random
import pickle
import nltk
nltk.download('omw-1.4')
from nltk.stem import WordNetLemmatizer

from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense, Activation, Dropout
from tensorflow.keras.optimizers import SGD

lemmatizer = WordNetLemmatizer()

intents = json.loads(open('intents.json').read())

words = []
classes = []
documents = []
ignore_letters = ['>','!,','.',',']


for intent in intents['intents']:
    for pattern in intent['patterns']:
        word_list = nltk.word_tokenize(pattern)
        words.extend(word_list)
        documents.append((word_list, intent['tag']))
        if intent['tag'] not in classes:
            classes.append(intent['tag'])

print(documents)

[nltk_data] Downloading package omw-1.4 to
[nltk_data]     C:\Users\elirj\AppData\Roaming\nltk_data...
[nltk_data]   Package omw-1.4 is already up-to-date!


[(['hello'], 'greetings'), (['hi'], 'greetings'), (['hey'], 'greetings'), (['hola'], 'greetings'), (['good', 'day'], 'greetings'), (['salutations'], 'greetings'), (['Yoo'], 'greetings'), (['I', 'am', 'here', 'to', 'check', 'if', 'I', 'have', 'the', 'virus'], 'diagnosis'), (['I', 'think', 'I', 'have', 'to', 'be', 'diagnosed'], 'diagnosis'), (['Can', 'you', 'diagnose', 'me', '?'], 'diagnosis'), (['I', 'think', 'I', "'m", 'Sick'], 'sick'), (['I', 'might', 'have', 'the', 'virus'], 'sick'), (['I', 'do', "n't", 'feel', 'well'], 'sick'), (['I', 'think', 'I', 'might', 'have', 'been', 'infected'], 'sick'), (['I', 'have', 'received', 'my', 'first', 'and', 'second', 'dose'], 'vaccination'), (['I', 'have', 'the', 'vaccination'], 'vaccination'), (['I', 'am', 'vaccinated', 'including', 'the', 'third', 'booster'], 'vaccination'), (['Yes', 'I', 'have', 'received', 'vaccination'], 'vaccination_positive'), (['yes', ',', 'I', 'have', 'one'], 'vaccination_positive'), (['I', 'have', 'the', 'vaccination'], 

In [2]:

# import json
# intents = json.loads(open('intents.json', 'r+').read())
# print(json.dumps(intents, indent=4))

In [3]:
words = [lemmatizer.lemmatize(word) for word in words if word not in ignore_letters]
words = sorted(set(words))
classes = sorted(set(classes))

pickle.dump(words, open('words.pkl', 'wb'))
pickle.dump(classes, open('classes.pkl', 'wb'))

training = []
output_empty = [0] * len(classes)

for document in documents:
    bag = []
    word_patterns = document[0]
    word_patterns = [lemmatizer.lemmatize(word.lower()) for word in word_patterns]
    for word in words:
        bag.append(1) if word in word_patterns else bag.append(0)
        
    output_row = list(output_empty)
    output_row[classes.index(document[1])] = 1
    training.append([bag, output_row])
    
random.shuffle(training)
training = np.array(training)

train_x = list(training[:,0])
train_y = list(training[:,1])
print(words)

["'m", '?', 'Can', 'How', 'I', 'Is', 'Later', 'May', 'No', 'See', 'Sick', 'What', 'Who', 'Yes', 'Yoo', 'age', 'am', 'and', 'are', 'ask', 'be', 'been', 'bleeding', 'bone', 'booster', 'born', 'broken', 'bye', 'campus', 'care', 'check', 'college', 'concussion', 'contageous', 'covid', 'cya', 'day', 'diagnose', 'diagnosed', 'diarrhea', 'do', 'dose', 'enter', 'feel', 'fever', 'first', 'flu', 'good', 'have', 'headache', 'hello', 'here', 'hey', 'hi', 'hola', 'if', 'impact', 'including', 'infected', 'is', 'it', 'me', 'might', 'my', "n't", 'name', 'not', 'old', 'one', 'please', 'possible', 'rash', 'received', 'salutation', 'screen', 'second', 'skin', 'sore', 'swelling', 'take', 'tell', 'the', 'think', 'third', 'this', 'tiredness', 'to', 'vaccinated', 'vaccination', 'virus', 'vomit', 'well', 'were', 'what', 'who', 'will', 'wound', 'year', 'yes', 'you', 'your']


In [4]:
model = Sequential()
model.add(Dense(128, input_shape=(len(train_x[0]),), activation="relu"))
model.add(Dropout(0.5))
model.add(Dense(64, activation="relu"))
model.add(Dropout(0.5))
model.add(Dense(len(train_y[0]), activation="softmax"))


In [5]:
sgd = SGD(lr=0.01, decay=1e-6, momentum=0.9, nesterov=True)
model.compile(loss='categorical_crossentropy', optimizer=sgd, metrics=['accuracy'])
model.fit(np.array(train_x), np.array(train_y), epochs=10, batch_size=5,)
hist = model.fit(np.array(train_x), np.array(train_y), epochs=200, batch_size=5, verbose=1)
model.save("model.h5", hist)
print("Done")

Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
Epoch 1/200
Epoch 2/200
Epoch 3/200
Epoch 4/200
Epoch 5/200
Epoch 6/200
Epoch 7/200
Epoch 8/200
Epoch 9/200
Epoch 10/200
Epoch 11/200
Epoch 12/200
Epoch 13/200
Epoch 14/200
Epoch 15/200
Epoch 16/200
Epoch 17/200
Epoch 18/200
Epoch 19/200
Epoch 20/200
Epoch 21/200
Epoch 22/200
Epoch 23/200
Epoch 24/200
Epoch 25/200
Epoch 26/200
Epoch 27/200
Epoch 28/200
Epoch 29/200
Epoch 30/200
Epoch 31/200
Epoch 32/200
Epoch 33/200
Epoch 34/200
Epoch 35/200
Epoch 36/200
Epoch 37/200
Epoch 38/200
Epoch 39/200
Epoch 40/200
Epoch 41/200
Epoch 42/200
Epoch 43/200
Epoch 44/200
Epoch 45/200
Epoch 46/200
Epoch 47/200
Epoch 48/200
Epoch 49/200
Epoch 50/200
Epoch 51/200
Epoch 52/200
Epoch 53/200
Epoch 54/200
Epoch 55/200
Epoch 56/200
Epoch 57/200
Epoch 58/200
Epoch 59/200
Epoch 60/200
Epoch 61/200
Epoch 62/200
Epoch 63/200
Epoch 64/200
Epoch 65/200
Epoch 66/200
Epoch 67/200
Epoch 68/200
Epoch 69/200
E

Epoch 72/200
Epoch 73/200
Epoch 74/200
Epoch 75/200
Epoch 76/200
Epoch 77/200
Epoch 78/200
Epoch 79/200
Epoch 80/200
Epoch 81/200
Epoch 82/200
Epoch 83/200
Epoch 84/200
Epoch 85/200
Epoch 86/200
Epoch 87/200
Epoch 88/200
Epoch 89/200
Epoch 90/200
Epoch 91/200
Epoch 92/200
Epoch 93/200
Epoch 94/200
Epoch 95/200
Epoch 96/200
Epoch 97/200
Epoch 98/200
Epoch 99/200
Epoch 100/200
Epoch 101/200
Epoch 102/200
Epoch 103/200
Epoch 104/200
Epoch 105/200
Epoch 106/200
Epoch 107/200
Epoch 108/200
Epoch 109/200
Epoch 110/200
Epoch 111/200
Epoch 112/200
Epoch 113/200
Epoch 114/200
Epoch 115/200
Epoch 116/200
Epoch 117/200
Epoch 118/200
Epoch 119/200
Epoch 120/200
Epoch 121/200
Epoch 122/200
Epoch 123/200
Epoch 124/200
Epoch 125/200
Epoch 126/200
Epoch 127/200
Epoch 128/200
Epoch 129/200
Epoch 130/200
Epoch 131/200
Epoch 132/200
Epoch 133/200
Epoch 134/200
Epoch 135/200
Epoch 136/200
Epoch 137/200
Epoch 138/200
Epoch 139/200
Epoch 140/200
Epoch 141/200
Epoch 142/200
Epoch 143/200
Epoch 144/200
Epoch 

Epoch 151/200
Epoch 152/200
Epoch 153/200
Epoch 154/200
Epoch 155/200
Epoch 156/200
Epoch 157/200
Epoch 158/200
Epoch 159/200
Epoch 160/200
Epoch 161/200
Epoch 162/200
Epoch 163/200
Epoch 164/200
Epoch 165/200
Epoch 166/200
Epoch 167/200
Epoch 168/200
Epoch 169/200
Epoch 170/200
Epoch 171/200
Epoch 172/200
Epoch 173/200
Epoch 174/200
Epoch 175/200
Epoch 176/200
Epoch 177/200
Epoch 178/200
Epoch 179/200
Epoch 180/200
Epoch 181/200
Epoch 182/200
Epoch 183/200
Epoch 184/200
Epoch 185/200
Epoch 186/200
Epoch 187/200
Epoch 188/200
Epoch 189/200
Epoch 190/200
Epoch 191/200
Epoch 192/200
Epoch 193/200
Epoch 194/200
Epoch 195/200
Epoch 196/200
Epoch 197/200
Epoch 198/200
Epoch 199/200
Epoch 200/200
Done
