From the dataset we observe a few things:
- This is a multilabel image classification problem
    - one or two possible types per image, so not multiclass
- We could make this multiclass if we consider combination types as their own class
    - not sure about this, though
- There is a class imbalance: far more normal and water types, and ice types are a fifth the size of the largest class
- This [guide](https://www.analyticsvidhya.com/blog/2019/04/build-first-multi-label-image-classification-model-python/) will help

Notes:
- one model for each type, which will give a probability score for each class
- the top two classes for each image will be the predicted types
    - the second type will have to be above a certain threshold else one type is predicted
    - Our class probabilities are independent of each other

In [28]:
import keras
from keras.models import Sequential
from keras.layers import Dense, Dropout, Flatten
from keras.layers import Conv2D, MaxPooling2D
from tensorflow.keras.utils import to_categorical
from keras.preprocessing import image
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
from tqdm import tqdm
%matplotlib inline

In [29]:
import tensorflow as tf
# Ask TensorFlow which GPU devices it can see; the bare `gpus` expression
# below makes the notebook display the resulting list.
gpus = tf.config.list_physical_devices('GPU')
gpus

[PhysicalDevice(name='/physical_device:GPU:0', device_type='GPU')]

In [30]:
# Cap on the number of CSV rows to read; set to None to load the whole file.
MAX_ROWS = 20000

# Read 'Key' as text: it is used verbatim to build image file names, and
# numeric parsing would alter keys that happen to look like numbers
# (e.g. a trailing zero would be dropped).
train = pd.read_csv('image_tagging/train.csv', nrows=MAX_ROWS, dtype={'Key': str})
train.head()

Unnamed: 0,Key,Type,Name,normal,fire,water,grass,electric,ice,fighting,...,ground,flying,psychic,bug,rock,ghost,dragon,dark,steel,fairy
0,110.95,"poison, ground",Weezing/Onix,0,0,0,0,0,0,0,...,1,0,0,0,0,0,0,0,0,0
1,155.408,"fire, fairy",Cyndaquil/Cottonee,0,1,0,0,0,0,0,...,0,0,0,0,0,0,0,0,0,1
2,360.381,"grass, psychic",Whimsicott/Jirachi,0,0,0,1,0,0,0,...,0,0,1,0,0,0,0,0,0,0
3,6.142e,"fire, flying",Charizard/Aerodactyl,0,1,0,0,0,0,0,...,0,1,0,0,0,0,0,0,0,0
4,289.175,"bug, fairy",Shedinja/Togepi,0,0,0,0,0,0,0,...,0,0,0,1,0,0,0,0,0,1


In [31]:
# List the column names of the loaded table.
train.columns

Index(['Key', 'Type', 'Name', 'normal', 'fire', 'water', 'grass', 'electric',
       'ice', 'fighting', 'poison', 'ground', 'flying', 'psychic', 'bug',
       'rock', 'ghost', 'dragon', 'dark', 'steel', 'fairy'],
      dtype='object')

In [None]:
# Directory holding the sprite images; each file is named "<Key>.png".
TRAINING_DATASET = "/blue/rcstudents/smaley/pokegan/customsprites/blk_bg/input"
# Model input shape as (height, width, channels).
IMAGE_SIZE = (256,256,3)

# Fill one preallocated float32 array instead of collecting per-image arrays
# in a list and converting afterwards, which holds every image in memory twice.
keys = train['Key']
X = np.empty((len(keys), *IMAGE_SIZE), dtype=np.float32)
for row, key in enumerate(tqdm(keys)):
    # load_img's target_size is (height, width) only, so drop the channel entry.
    img = image.load_img(f"{TRAINING_DATASET}/{key}.png", target_size=IMAGE_SIZE[:2])
    # Scale pixel values from [0, 255] to [0, 1].
    X[row] = image.img_to_array(img) / 255

 99%|█████████▉| 19875/20000 [00:41<00:00, 186.94it/s]

In [None]:
# Check the shape of the stacked image array.
X.shape

In [None]:
# Display the image stored at index 2 as a visual sanity check.
plt.imshow(X[2])

In [None]:
# Look up the 'Type' value of row 2 (same index as X[2]).
train['Type'][2]

In [None]:
# Every column other than the three identifier/description columns is kept;
# stack those remaining columns into the label matrix.
label_frame = train.drop(columns=['Key', 'Type', 'Name'])
y = np.array(label_frame)
y.shape

In [None]:
# Hold out 10% of the samples for evaluation; the fixed seed keeps the split
# reproducible between runs.
X_train, X_test, y_train, y_test = train_test_split(
    X,
    y,
    test_size=0.1,
    random_state=42,
)

In [None]:
# Four identical convolution stages (5x5 conv -> 2x2 max-pool -> dropout) with
# growing filter counts, followed by two dense stages and a sigmoid output.
model = Sequential()

for stage, n_filters in enumerate((16, 32, 64, 64)):
    # Only the very first layer declares the input shape.
    first_layer_args = {"input_shape": IMAGE_SIZE} if stage == 0 else {}
    model.add(Conv2D(filters=n_filters, kernel_size=(5, 5), activation="relu", **first_layer_args))
    model.add(MaxPooling2D(pool_size=(2, 2)))
    model.add(Dropout(0.25))

model.add(Flatten())

for n_units in (128, 64):
    model.add(Dense(n_units, activation="relu"))
    model.add(Dropout(0.5))

# One sigmoid unit per class; keep the unit count equal to the number of classes.
model.add(Dense(18, activation="sigmoid"))

In [None]:
# Print the layer-by-layer summary of the model.
model.summary()

In [None]:
# Configure training: Adam optimizer, binary cross-entropy loss, and accuracy
# reported as the tracked metric.
model.compile(optimizer='adam', loss='binary_crossentropy', metrics=['accuracy'])

In [None]:
# Train for 10 epochs in batches of 64; the held-out split is passed as the
# validation data.
model.fit(X_train, y_train, epochs=10, validation_data=(X_test, y_test), batch_size=64)

In [None]:
# Load one sprite and preprocess it the same way as the training images.
# load_img's target_size is (height, width), so pass only the first two
# entries of IMAGE_SIZE rather than the full (height, width, channels) tuple.
img = image.load_img(f"{TRAINING_DATASET}/338.287i.png", target_size=IMAGE_SIZE[:2])
# Scale pixel values from [0, 255] to [0, 1].
img = image.img_to_array(img) / 255

In [None]:
# Class names must line up with the columns of y, which is built from every
# column except 'Key', 'Type' and 'Name'. Slicing columns[2:] kept 'Name' and
# shifted every printed label by one position.
classes = np.array(train.columns.drop(['Key', 'Type', 'Name']))
# The model expects a batch axis, so wrap the single image in a batch of one.
proba = model.predict(img[np.newaxis, ...])
# Indices of the three highest scores, best first.
top_3 = np.argsort(proba[0])[:-4:-1]
for idx in top_3:
    print(f"{classes[idx]} ({proba[0][idx]:.3})")
plt.imshow(img)