# In [21]:
import tensorflow as tf
import numpy as np
import pandas as pd
from collections import Counter
from sklearn.model_selection import train_test_split
from sklearn.metrics import accuracy_score


def move_accuracy(y_test, y_pred):
    """Return the mean target value at each row's top-scoring predicted move.

    For every row, the position of the largest value in ``y_pred`` is taken
    as the predicted move. The ``y_test`` entry at that position is that
    row's score (1 when the predicted move is marked correct in the test
    vector), and the scores are averaged over all rows.

    Args:
        y_test: 2-D array-like of target values, one row per sample
            (presumably 0/1 indicators of acceptable moves -- confirm
            against the dataset).
        y_pred: 2-D array-like of predicted scores with the same shape as
            ``y_test``.

    Returns:
        The mean of the ``y_test`` entries selected by the row-wise argmax
        of ``y_pred``.
    """
    targets = np.asarray(y_test)
    scores = np.asarray(y_pred)
    # argmax selects exactly one move per row. An equality mask against the
    # row maximum would select every tied position and therefore count a
    # tied row several times in the mean.
    best_move = np.argmax(scores, axis=1)
    row_index = np.arange(scores.shape[0])
    return np.mean(targets[row_index, best_move])

# Seed NumPy's global RNG; train_test_split below is called without an
# explicit random_state, so it draws from this generator.
np.random.seed(1234)

df = pd.read_csv("tictactoe-data.csv")

# Show how often each value of the "score" column occurs.
print(Counter(df["score"]))

# Design matrix: columns 0-17 plus the second-to-last column of the CSV
# (19 feature columns in total).
Xdes = df.iloc[:, list(range(18)) + [-2]]

print(Xdes.shape)

# Targets: the nine columns 18-26; the network gets one output unit per column.
moves = df.iloc[:, 18:27]

X_train, X_test, y_train, y_test = train_test_split(Xdes, moves, test_size=0.2)

# Each Dense(...) call adds one fully connected layer: the first argument is
# the number of neurons, followed by the activation function. The first layer
# additionally declares the number of input features.
model = tf.keras.Sequential()
model.add(tf.keras.layers.Dense(128, activation="relu", input_dim=Xdes.shape[1]))

# Reduce overfitting: each Dropout(0.2) layer randomly switches off 20% of the
# preceding layer's outputs during training.
# Optional extra hidden layer, currently disabled:
#model.add(tf.keras.layers.Dropout(0.2))
#model.add(tf.keras.layers.Dense(64, activation="relu"))
model.add(tf.keras.layers.Dropout(0.2))
model.add(tf.keras.layers.Dense(32, activation="relu"))
model.add(tf.keras.layers.Dense(moves.shape[1], activation="softmax"))

# Define the cost/loss function; categorical cross-entropy suits a choice
# among several output options.
model.compile(optimizer="adam", loss="categorical_crossentropy", metrics=["accuracy"])

# Train the model. validation_data is passed as the documented
# (x_val, y_val) tuple rather than a list.
model.fit(
    X_train,
    y_train,
    epochs=100,
    batch_size=16,
    validation_data=(X_test, y_test),
)

model.save("tictacNet.h5")
print("Custom accuracy:", move_accuracy(y_test.values, model.predict(X_test)))

# Recorded cell output (the run was stopped with a KeyboardInterrupt):
#
# Counter({1: 2310, -1: 1158, 0: 1052})
# (4520, 19)
# Train on 3616 samples, validate on 904 samples
# Epoch 1/100
# Epoch 2/100
# Epoch 3/100
# Epoch 4/100
# Epoch 5/100
# Epoch 6/100
# Epoch 7/100
# Epoch 8/100
# Epoch 9/100
#
#
# KeyboardInterrupt: