In [1]:
# Enable IPython's autoreload extension in mode 2, so edits to imported
# modules are picked up without restarting the kernel.
%load_ext autoreload
%autoreload 2

# Experiments with WTF model

In [2]:
from pathlib import Path

import src.io as io
import src.evaluation as evaluation
import src.evaluation.splits
import src.evaluation.cars

from src.algorithm.cars.wtf import WTF

## Datasets

In [3]:
## Pick the dataset by name via DATASET; each entry is (data directory, RETARGET).
## RETARGET is True for Frappe, False for the others.
# NOTE(review): the outputs stored in this notebook show `TripType` / `UserState`
# context columns, which suggests they were produced with a different selection
# than the one saved here -- confirm, and re-run all cells after changing DATASET.
DATASETS = {
    'Mobile_Frappe': (Path('../../../data/CARS/Mobile_Frappe/'), True),
    'Food_com': (Path('../../../data/CARS/Food_com/'), False),
    'TripAdvisor': (Path('../../../data/CARS/TripAdvisor/'), False),
}

DATASET = 'Food_com'
DATA_DIR, RETARGET = DATASETS[DATASET]

In [4]:
# Fixed settings -- these normally stay the same whichever dataset is selected.

# Identifiers handed to the interaction parser as user_id / item_id.
USER_ID, ITEM_ID = 'user', 'item'

# SEED drives the tuning split, SEED2 the k-fold evaluation.
SEED, SEED2 = 123456, 78910

# Interaction file inside the selected dataset directory.
INTERACTIONS = DATA_DIR.joinpath('interactions.csv')

## Define algorithm and hyperparameter ranges

In [5]:
# Model class handed to the grid search and instantiated for the final evaluation.
ALG = WTF

# --- settings held at a single value ---------------------------------------
K = [160]  # alternative left for reference: [80]
MAX_IT = [10]
MAX_CG_IT = [10]
DEFAULT_CONTEXT_1 = [True]

# --- settings that are swept (4 * 3 * 4 = 48 combinations) -----------------
L2 = [100, 1000, 10000, 100000]
V = [0, 0.5, 1]
ALPHA = [100, 1000, 10000, 100000]

# Other candidate ranges, disabled; swap one trio in for the three lists above.
#   L2 = [5000, 10000, 20000, 50000]
#   V = [0.25, 0.5, 0.75]
#   ALPHA = [500, 1000, 2000, 5000]
#
#   L2 = [100, 500, 1000, 2000]
#   V = [0.75, 1]
#   ALPHA = [1, 10, 50, 100, 200]

# Each key is a keyword argument of ALG; each value lists the candidates to try.
HYPERPARAMS = dict(
    k=K,
    l2=L2,
    v=V,
    alpha=ALPHA,
    max_iterations=MAX_IT,
    default_context_1=DEFAULT_CONTEXT_1,
    max_cg_iter=MAX_CG_IT,
)
HYPERPARAMS

{'k': [160],
 'l2': [100, 1000, 10000, 100000],
 'v': [0, 0.5, 1],
 'alpha': [100, 1000, 10000, 100000],
 'max_iterations': [10],
 'default_context_1': [True],
 'max_cg_iter': [10]}

## Parse data

In [6]:
# Read the interaction file; the resulting frame (shown below) carries the
# context columns next to the user and item columns.
data = io.parse_interactions_with_context(
    INTERACTIONS,
    item_id=ITEM_ID,
    user_id=USER_ID,
)
data.df

Unnamed: 0,userId,itemId,TripType,UserState
0,1899,1865,1,1
1,466,721,1,1
2,1992,451,2,1
3,466,1016,1,1
4,1441,414,3,1
...,...,...,...,...
12831,936,341,3,78
12832,1545,1936,3,78
12833,399,1556,2,79
12834,918,1380,5,79


## Make train/val split for hyperparam tuning

In [7]:
# The held-out part is named `test`, but it serves as the validation set that
# the grid search scores against.
train, test = evaluation.splits.context_leave_one_out_split(
    data,
    seed=SEED,
)

## Perform grid search on the validation set

In [8]:
%%time
score, best_hyperparams = evaluation.cars.gridsearch(ALG, train, test, HYPERPARAMS, retarget=RETARGET)
f"Best score of {score} achieved with {best_hyperparams}."

  0%|          | 0/48 [00:00<?, ?it/s]

Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.022
MRR@20 0.027
Average Recall@5 0.041
Average Recall@20 0.097
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.017
MRR@20 0.023
Average Recall@5 0.033
Average Recall@20 0.093
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0.5, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.031
Average Recall@5 0.043
Average Recall@20 0.111
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0.5, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.046
Average Recall@20 0.105
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0.5, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0.5, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.068
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.018
MRR@20 0.024
Average Recall@5 0.034
Average Recall@20 0.091
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.022
MRR@20 0.027
Average Recall@5 0.035
Average Recall@20 0.092
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 1, 'alpha': 100, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.009
MRR@20 0.013
Average Recall@5 0.017
Average Recall@20 0.056
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.018
MRR@20 0.024
Average Recall@5 0.033
Average Recall@20 0.099
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.013
MRR@20 0.019
Average Recall@5 0.025
Average Recall@20 0.086
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0.5, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.013
MRR@20 0.017
Average Recall@5 0.024
Average Recall@20 0.064
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0.5, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.018
MRR@20 0.024
Average Recall@5 0.033
Average Recall@20 0.098
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0.5, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.013
MRR@20 0.018
Average Recall@5 0.025
Average Recall@20 0.083
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0.5, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.013
MRR@20 0.017
Average Recall@5 0.029
Average Recall@20 0.067
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.015
MRR@20 0.018
Average Recall@5 0.029
Average Recall@20 0.063
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.026
MRR@20 0.032
Average Recall@5 0.047
Average Recall@20 0.113
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.008
MRR@20 0.011
Average Recall@5 0.016
Average Recall@20 0.041
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.005
MRR@20 0.008
Average Recall@5 0.013
Average Recall@20 0.041
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.012
MRR@20 0.017
Average Recall@5 0.021
Average Recall@20 0.079
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.011
MRR@20 0.015
Average Recall@5 0.019
Average Recall@20 0.066
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0.5, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.006
MRR@20 0.009
Average Recall@5 0.012
Average Recall@20 0.042
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0.5, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.006
MRR@20 0.009
Average Recall@5 0.013
Average Recall@20 0.041
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0.5, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.016
MRR@20 0.023
Average Recall@5 0.033
Average Recall@20 0.102
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0.5, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.015
Average Recall@20 0.065
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 1, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.006
MRR@20 0.008
Average Recall@5 0.012
Average Recall@20 0.037
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 1, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.007
MRR@20 0.009
Average Recall@5 0.015
Average Recall@20 0.041
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 1, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.016
MRR@20 0.02
Average Recall@5 0.032
Average Recall@20 0.077
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 1, 'alpha': 10000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.02
Average Recall@20 0.069
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.008
MRR@20 0.01
Average Recall@5 0.018
Average Recall@20 0.043
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.006
MRR@20 0.008
Average Recall@5 0.014
Average Recall@20 0.039
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.005
MRR@20 0.008
Average Recall@5 0.012
Average Recall@20 0.038
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.008
MRR@20 0.012
Average Recall@5 0.018
Average Recall@20 0.066
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 0.5, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.007
MRR@20 0.009
Average Recall@5 0.016
Average Recall@20 0.045
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 0.5, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.004
MRR@20 0.006
Average Recall@5 0.011
Average Recall@20 0.032
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 0.5, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.007
MRR@20 0.01
Average Recall@5 0.016
Average Recall@20 0.047
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 0.5, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.014
MRR@20 0.02
Average Recall@5 0.026
Average Recall@20 0.087
Training model WTF with hyperparameters {'k': 160, 'l2': 100, 'v': 1, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.006
MRR@20 0.009
Average Recall@5 0.013
Average Recall@20 0.042
Training model WTF with hyperparameters {'k': 160, 'l2': 1000, 'v': 1, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.004
MRR@20 0.007
Average Recall@5 0.011
Average Recall@20 0.036
Training model WTF with hyperparameters {'k': 160, 'l2': 10000, 'v': 1, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.013
Average Recall@5 0.021
Average Recall@20 0.05
Training model WTF with hyperparameters {'k': 160, 'l2': 100000, 'v': 1, 'alpha': 100000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.021
MRR@20 0.027
Average Recall@5 0.041
Average Recall@20 0.108
CPU times: user 9min 16s, sys: 3min 46s, total: 13min 2s
Wall time: 25min 42s


"Best score of 0.03192388360587832 achieved with {'k': 160, 'l2': 10000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True, 'max_cg_iter': 10}."

## Evaluate the model with the optimal hyperparameters using K-fold cross-validation

In [9]:
%%time
alg = ALG(**best_hyperparams)
results = evaluation.cars.contextKFoldsEval(alg, data, nr_folds=5, seed=SEED2, retarget=RETARGET)

  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024 (0.003)
MRR@20 0.03 (0.003)
Average Recall@5 0.045 (0.004)
Average Recall@20 0.108 (0.004)
CPU times: user 57.8 s, sys: 23.5 s, total: 1min 21s
Wall time: 2min 42s
