## Import Libraries & Load Dataset

In [1]:
import numpy as np
import pandas as pd
from tensorflow.keras.callbacks import ModelCheckpoint
from tensorflow.keras.models import Model
from tensorflow.keras.optimizers import Adam
from tensorflow.keras.layers import Dense, GRU, Dropout
from tensorflow.keras.utils import to_categorical

## Emoji Classification Dataset

In [2]:
def read_csv(x):
    """Read a labelled-sentence CSV file and return its two columns.

    Parameters
    ----------
    x : str or path-like
        Location of a CSV file that has a ``sentence`` column and a
        ``label`` column.

    Returns
    -------
    tuple
        ``(sentences, labels)`` — the ``.values`` arrays of the
        ``sentence`` and ``label`` columns, in that order.
    """
    frame = pd.read_csv(x)
    # "sentence" is looked up first, then "label", matching the return order.
    sentences, labels = (frame[column].values for column in ("sentence", "label"))
    return sentences, labels

In [3]:
# Load the train and test splits; each call returns (sentences, labels) arrays.
x_train, y_train = read_csv("Emoji_Text_Classification/train.csv")
x_test, y_test = read_csv("Emoji_Text_Classification/test.csv")

In [4]:
def label_to_emoji(label):
    """Return the emoji string that represents an integer class label.

    Parameters
    ----------
    label : int
        Class index in ``0..4`` (any object usable as a list index works,
        e.g. a NumPy integer).

    Returns
    -------
    str
        The emoji for that class.

    Raises
    ------
    IndexError
        If ``label`` is outside the range of the emoji table.
    """
    # Written as Unicode escapes so the emoji cannot be corrupted when the
    # notebook is saved or re-read with the wrong text encoding.
    emojies = [
        "\u2764\ufe0f",      # 0: red heart
        "\U0001F3D0",        # 1: volleyball
        "\U0001F606",        # 2: grinning squinting face
        "\U0001F614",        # 3: pensive face
        "\U0001F37D\ufe0f",  # 4: fork and knife with plate
    ]
    return emojies[label]

In [5]:
# Sanity check: print one training sentence next to the emoji for its label.
index = 10
print(x_train[index],label_to_emoji(y_train[index]))

she did not answer my text  😔


In [6]:
def calc_max_len(x_train,x_test):
    """Return the largest per-sentence token count across both splits.

    Each sentence is split on single space characters, so consecutive or
    trailing spaces contribute empty tokens to the count.

    Parameters
    ----------
    x_train, x_test : iterable of str
        Sentences of the training and test splits.

    Returns
    -------
    int
        The maximum number of space-separated pieces in any sentence.

    Raises
    ------
    ValueError
        If either split is empty.
    """
    def longest(sentences):
        # Longest sentence of one split, measured in space-separated pieces.
        return max(len(sentence.split(" ")) for sentence in sentences)

    train_longest = longest(x_train)
    test_longest = longest(x_test)
    return train_longest if train_longest >= test_longest else test_longest

In [7]:
# One-hot encode the integer labels over 5 classes.
y_train_oh = to_categorical(y_train,5)
y_test_oh = to_categorical(y_test,5)

In [8]:
# Build word_to_vec: a dict mapping each word to its embedding vector.
# Each line of the file is read as "<word> <v1> <v2> ..."; the file name
# suggests 50-dimensional GloVe vectors (presumably glove.6B — confirm source).
with open("glove.6B.50d.txt", encoding="utf8") as text:
    word_to_vec = dict()
    for line in text:
        # Split on whitespace: first token is the word, the rest are the components.
        line = line.split()
        words = line[0]
        vecs = line[1:]
        # Convert the string components to a float64 NumPy array.
        vecs = np.array(vecs,dtype=np.float64)
        word_to_vec[words] = vecs

In [9]:
def convert_to_embedding(x, max_len=None, embeddings=None, vec_size=50):
    """Turn sentences into a zero-padded tensor of word embeddings.

    Every sentence is lower-cased and split on whitespace, and each token is
    replaced by its embedding vector. Positions after the last token stay
    zero (padding).

    Parameters
    ----------
    x : sequence of str
        Sentences to embed (NumPy array or list).
    max_len : int, optional
        Number of time steps in the output. Defaults to
        ``calc_max_len(x_train, x_test)`` computed from the notebook's
        global train/test splits.
    embeddings : mapping of str to array-like, optional
        Word-to-vector lookup. Defaults to the notebook's global
        ``word_to_vec``.
    vec_size : int, optional
        Dimensionality of each embedding vector (default 50).

    Returns
    -------
    numpy.ndarray
        Array of shape ``(len(x), max_len, vec_size)``.

    Notes
    -----
    * Words missing from ``embeddings`` are left as zero vectors instead of
      raising ``KeyError``.
    * Sentences with more than ``max_len`` tokens are truncated instead of
      raising ``IndexError``; this matters when embedding new sentences
      that are longer than anything in the train/test splits.
    """
    if max_len is None:
        max_len = calc_max_len(x_train, x_test)
    if embeddings is None:
        embeddings = word_to_vec

    embedd_matrix = np.zeros((len(x), max_len, vec_size))
    for i, sentence in enumerate(x):
        # Keep only as many tokens as there are time steps in the output.
        tokens = sentence.lower().split()[:max_len]
        for j, token in enumerate(tokens):
            vector = embeddings.get(token)
            if vector is not None:  # unknown word -> keep the zero vector
                embedd_matrix[i, j, :] = vector

    return embedd_matrix

In [10]:
x_train_embedd = convert_to_embedding(x_train)
x_test_embedd = convert_to_embedding(x_test)

In [11]:
print(x_train_embedd.shape)
print(y_train_oh.shape)

(132, 10, 50)
(132, 5)


# RNN
## GRU Model

In [12]:
class MyModel(Model):
    """Stacked-GRU sentence classifier with a 5-way softmax output.

    Layers, in the order they are applied: three GRU layers of 512 units
    (the first two return the full sequence so the next GRU can consume it,
    the third returns only its final output), a dropout layer with rate 0.5,
    and a dense softmax layer with 5 outputs.
    """

    def __init__(self):
        """Create the layers; no arguments are configurable."""
        super().__init__()
        hidden_units = 512
        self.gru1 = GRU(hidden_units, return_sequences=True)
        self.gru2 = GRU(hidden_units, return_sequences=True)
        self.gru3 = GRU(hidden_units)
        self.dropout = Dropout(0.5)
        self.fc = Dense(5, activation="softmax")

    def call(self, x):
        """Run ``x`` through every layer in order and return the class probabilities."""
        pipeline = (self.gru1, self.gru2, self.gru3, self.dropout, self.fc)
        for layer in pipeline:
            x = layer(x)
        return x

In [13]:
# Instantiate the network and configure training: Adam with a learning rate
# of 1e-4, categorical cross-entropy loss, and accuracy as the reported metric.
model = MyModel()
model.compile(optimizer=Adam(learning_rate=0.0001),loss="categorical_crossentropy",metrics=["accuracy"])

In [14]:
# Train for 100 epochs with mini-batches of 8 sentences.
# NOTE(review): the test split is passed as validation data, so the validation
# metrics are computed on the same data that serves as the test set.
history = model.fit(x_train_embedd,y_train_oh,
         batch_size=8,
          epochs=100,
         validation_data=(x_test_embedd,y_test_oh))

Epoch 1/100
Epoch 2/100
Epoch 3/100
Epoch 4/100
Epoch 5/100
Epoch 6/100
Epoch 7/100
Epoch 8/100
Epoch 9/100
Epoch 10/100
Epoch 11/100
Epoch 12/100
Epoch 13/100
Epoch 14/100
Epoch 15/100
Epoch 16/100
Epoch 17/100
Epoch 18/100
Epoch 19/100
Epoch 20/100
Epoch 21/100
Epoch 22/100
Epoch 23/100
Epoch 24/100
Epoch 25/100
Epoch 26/100
Epoch 27/100
Epoch 28/100
Epoch 29/100
Epoch 30/100
Epoch 31/100
Epoch 32/100
Epoch 33/100
Epoch 34/100
Epoch 35/100
Epoch 36/100
Epoch 37/100
Epoch 38/100
Epoch 39/100
Epoch 40/100
Epoch 41/100
Epoch 42/100
Epoch 43/100
Epoch 44/100
Epoch 45/100
Epoch 46/100
Epoch 47/100
Epoch 48/100
Epoch 49/100
Epoch 50/100
Epoch 51/100
Epoch 52/100
Epoch 53/100
Epoch 54/100
Epoch 55/100
Epoch 56/100
Epoch 57/100
Epoch 58/100


Epoch 59/100
Epoch 60/100
Epoch 61/100
Epoch 62/100
Epoch 63/100
Epoch 64/100
Epoch 65/100
Epoch 66/100
Epoch 67/100
Epoch 68/100
Epoch 69/100
Epoch 70/100
Epoch 71/100
Epoch 72/100
Epoch 73/100
Epoch 74/100
Epoch 75/100
Epoch 76/100
Epoch 77/100
Epoch 78/100
Epoch 79/100
Epoch 80/100
Epoch 81/100
Epoch 82/100
Epoch 83/100
Epoch 84/100
Epoch 85/100
Epoch 86/100
Epoch 87/100
Epoch 88/100
Epoch 89/100
Epoch 90/100
Epoch 91/100
Epoch 92/100
Epoch 93/100
Epoch 94/100
Epoch 95/100
Epoch 96/100
Epoch 97/100
Epoch 98/100
Epoch 99/100
Epoch 100/100


In [16]:
# Try the trained model on a few hand-written sentences.
x_example = np.array(["not sad", "i adore you", "i love you", "funny lol", "lets play with a ball", "food is ready", "not feeling happy"])
# Labels for the examples above; defined here but not used by the code below.
y_example = np.array([[2],[0],[0],[2],[1],[4],[3]])
x_example_embedd = convert_to_embedding(x_example)
pred = model.predict(x_example_embedd)
# Print each sentence with the emoji of its highest-scoring class.
for i in range(x_example.shape[0]):
    print(x_example[i], label_to_emoji(np.argmax(pred[i])))

not sad 😔
i adore you ❤️
i love you ❤️
funny lol 😆
lets play with a ball 🏐
food is ready 🍽️
not feeling happy 😔
