In [1]:
# Enable IPython's autoreload extension in mode 2: imported modules are
# reloaded before each cell runs, so edits to the project's source files are
# picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

# Experiments with WTF model

In [2]:
from pathlib import Path

import src.io as io
import src.evaluation as evaluation
import src.evaluation.splits
import src.evaluation.cars

from src.algorithm.cars.wtf import WTF

## Datasets

In [3]:
## Pick the dataset by name instead of (un)commenting lines.
## RETARGET is True for Frappe, False for the others.

# Dataset name -> (data directory, RETARGET flag).
DATASETS = {
    'Mobile_Frappe': (Path('../../../data/CARS/Mobile_Frappe/'), True),
    'Food_com': (Path('../../../data/CARS/Food_com/'), False),
    'TripAdvisor': (Path('../../../data/CARS/TripAdvisor/'), False),
}

# Change only this key to switch datasets; the directory and its RETARGET flag
# are looked up together so they cannot get out of sync.
DATASET = 'Mobile_Frappe'
DATA_DIR, RETARGET = DATASETS[DATASET]

In [4]:
# Fixed settings: these should not need changing when switching datasets.

# Interactions file inside the selected dataset directory.
INTERACTIONS = DATA_DIR.joinpath('interactions.csv')

# Identifiers handed to the interaction parser as user_id / item_id.
USER_ID, ITEM_ID = 'user', 'item'

# SEED is used for the tuning split, SEED2 for the K-fold evaluation.
SEED, SEED2 = 123456, 78910

## Define algorithm and hyperparameter ranges

In [5]:
# Algorithm class under evaluation: handed to the gridsearch as-is and later
# instantiated with the best hyperparameters for the final evaluation.
ALG = WTF

# Single-value grids: these settings are held fixed during the search.
K, MAX_IT, DEFAULT_CONTEXT_1 = [80], [10], [True]

# Alternative, coarser ranges (currently disabled, kept for reference):
#   L2    = [100, 1000, 10000, 100000]
#   V     = [0, 0.5, 1]
#   ALPHA = [100, 1000, 10000, 100000]

# Ranges searched in this run.
L2 = [500, 1000, 2000, 5000]
V = [0.75, 1]
ALPHA = [1, 10, 50, 100, 200]

# Keyword name -> list of candidate values; every combination is a candidate
# configuration for the gridsearch.
HYPERPARAMS = dict(
    k=K,
    l2=L2,
    v=V,
    alpha=ALPHA,
    max_iterations=MAX_IT,
    default_context_1=DEFAULT_CONTEXT_1,
)
HYPERPARAMS

{'k': [80],
 'l2': [500, 1000, 2000, 5000],
 'v': [0.75, 1],
 'alpha': [1, 10, 50, 100, 200],
 'max_iterations': [10],
 'default_context_1': [True]}

## Parse data

In [6]:
# Parse the interactions file using the configured user/item identifiers.
data = io.parse_interactions_with_context(
    INTERACTIONS,
    item_id=ITEM_ID,
    user_id=USER_ID,
)
# Show the parsed table as the cell output.
data.df

Unnamed: 0,userId,itemId,daytime,weather,weekday
0,0,0,1,1,1
1,1,1,2,2,2
2,2,2,3,2,3
3,3,3,4,0,4
4,4,4,5,1,4
...,...,...,...,...,...
95997,109,0,3,1,1
95998,37,16,4,2,1
95999,180,33,2,2,1
96000,445,751,3,1,1


## Make train/val split for hyperparam tuning

In [7]:
# Split used for hyperparameter tuning only. Note that `test` acts as the
# validation set here: it is the data the gridsearch scores candidates on.
train, test = evaluation.splits.context_leave_one_out_split(
    data,
    seed=SEED,
)

## Perform gridsearch on validation set

In [8]:
%%time
score, best_hyperparams = evaluation.cars.gridsearch(ALG, train, test, HYPERPARAMS, retarget=RETARGET)
f"Best score of {score} achieved with {best_hyperparams}."

  0%|          | 0/40 [00:00<?, ?it/s]

Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.75, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.217
MRR@20 0.232
Average Recall@5 0.335
Average Recall@20 0.483
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.75, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.157
MRR@20 0.17
Average Recall@5 0.271
Average Recall@20 0.403
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.75, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.128
MRR@20 0.143
Average Recall@5 0.241
Average Recall@20 0.385
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.127
MRR@20 0.141
Average Recall@5 0.241
Average Recall@20 0.386
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 1, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.234
MRR@20 0.25
Average Recall@5 0.364
Average Recall@20 0.513
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 1, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.188
MRR@20 0.202
Average Recall@5 0.292
Average Recall@20 0.43
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 1, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.128
MRR@20 0.143
Average Recall@5 0.241
Average Recall@20 0.386
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 1, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.128
MRR@20 0.142
Average Recall@5 0.243
Average Recall@20 0.387
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.75, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.25
MRR@20 0.274
Average Recall@5 0.392
Average Recall@20 0.607
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.75, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.213
MRR@20 0.234
Average Recall@5 0.33
Average Recall@20 0.528
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.75, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.151
MRR@20 0.17
Average Recall@5 0.265
Average Recall@20 0.451
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.131
MRR@20 0.147
Average Recall@5 0.243
Average Recall@20 0.397
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 1, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.267
MRR@20 0.288
Average Recall@5 0.431
Average Recall@20 0.632
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 1, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.234
MRR@20 0.255
Average Recall@5 0.359
Average Recall@20 0.554
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 1, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.187
MRR@20 0.206
Average Recall@5 0.299
Average Recall@20 0.479
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 10, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.116
MRR@20 0.133
Average Recall@5 0.241
Average Recall@20 0.396
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.75, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.27
MRR@20 0.293
Average Recall@5 0.46
Average Recall@20 0.676
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.75, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.24
MRR@20 0.266
Average Recall@5 0.402
Average Recall@20 0.637
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.75, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.203
MRR@20 0.225
Average Recall@5 0.335
Average Recall@20 0.55
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.131
MRR@20 0.148
Average Recall@5 0.261
Average Recall@20 0.439
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 1, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.27
MRR@20 0.295
Average Recall@5 0.457
Average Recall@20 0.685
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 1, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.259
MRR@20 0.282
Average Recall@5 0.428
Average Recall@20 0.651
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 1, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.225
MRR@20 0.249
Average Recall@5 0.362
Average Recall@20 0.586
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.168
MRR@20 0.187
Average Recall@5 0.286
Average Recall@20 0.464
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.75, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.267
MRR@20 0.292
Average Recall@5 0.464
Average Recall@20 0.69
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.75, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.251
MRR@20 0.277
Average Recall@5 0.434
Average Recall@20 0.67
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.75, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.22
MRR@20 0.244
Average Recall@5 0.364
Average Recall@20 0.605
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.162
MRR@20 0.182
Average Recall@5 0.277
Average Recall@20 0.472
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.259
MRR@20 0.283
Average Recall@5 0.471
Average Recall@20 0.701
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.254
MRR@20 0.28
Average Recall@5 0.436
Average Recall@20 0.675
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.238
MRR@20 0.262
Average Recall@5 0.4
Average Recall@20 0.616
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.174
MRR@20 0.194
Average Recall@5 0.316
Average Recall@20 0.509
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.75, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.26
MRR@20 0.286
Average Recall@5 0.472
Average Recall@20 0.707
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.75, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.254
MRR@20 0.28
Average Recall@5 0.451
Average Recall@20 0.7
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.75, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.229
MRR@20 0.256
Average Recall@5 0.391
Average Recall@20 0.643
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.169
MRR@20 0.193
Average Recall@5 0.289
Average Recall@20 0.521
Training model WTF with hyperparameters {'k': 80, 'l2': 500, 'v': 1, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.264
MRR@20 0.29
Average Recall@5 0.469
Average Recall@20 0.708
Training model WTF with hyperparameters {'k': 80, 'l2': 1000, 'v': 1, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.251
MRR@20 0.277
Average Recall@5 0.45
Average Recall@20 0.7
Training model WTF with hyperparameters {'k': 80, 'l2': 2000, 'v': 1, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.246
MRR@20 0.273
Average Recall@5 0.411
Average Recall@20 0.657
Training model WTF with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 200, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.205
MRR@20 0.229
Average Recall@5 0.339
Average Recall@20 0.569
CPU times: user 10min 44s, sys: 3min 58s, total: 14min 43s
Wall time: 33min 38s


"Best score of 0.2945543186529858 achieved with {'k': 80, 'l2': 500, 'v': 1, 'alpha': 50, 'max_iterations': 10, 'default_context_1': True}."

## Evaluate the model with the optimal hyperparameters using K-fold cross-validation

In [9]:
%%time
alg = ALG(**best_hyperparams)
results = evaluation.cars.contextKFoldsEval(alg, data, nr_folds=5, seed=SEED2, retarget=RETARGET)

  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.274 (0.005)
MRR@20 0.296 (0.005)
Average Recall@5 0.45 (0.007)
Average Recall@20 0.656 (0.009)
CPU times: user 1min 18s, sys: 29.3 s, total: 1min 48s
Wall time: 4min 10s
