In [1]:
# Enable IPython's autoreload extension so that edits to imported modules
# (e.g. the local `src` package) are picked up live, without a kernel restart.
%load_ext autoreload
%autoreload 2

# Experiments with iTALS model

In [2]:
from pathlib import Path

import src.io as io
import src.evaluation as evaluation
import src.evaluation.splits
import src.evaluation.cars

from src.algorithm.cars.itals import iTALS

## Datasets

In [3]:
## Select the dataset by name instead of (un)commenting whole lines.
## Each entry maps the dataset's sub-directory to its RETARGET flag:
## RETARGET is True for Frappe and False for the others.
CARS_ROOT = Path('../../../data/CARS')

DATASETS = {
    'Mobile_Frappe': True,
    'Food_com': False,
    'TripAdvisor': False,
}

## Change only this name to switch datasets; an unknown name raises KeyError
## immediately instead of failing later on a missing file.
DATASET = 'Food_com'

DATA_DIR, RETARGET = CARS_ROOT / DATASET, DATASETS[DATASET]

In [4]:
# Settings below normally stay untouched.

# Interactions file inside the selected dataset directory.
INTERACTIONS = DATA_DIR.joinpath('interactions.csv')

# SEED is used for the tuning split, SEED2 for the K-fold evaluation.
SEED, SEED2 = 123456, 78910

# Identifier settings forwarded to the interactions parser.
USER_ID, ITEM_ID = 'user', 'item'

## Define algorithm and hyperparameter ranges

In [5]:
# Algorithm class under test: handed to the grid search and later instantiated
# with the best hyperparameters found.
ALG = iTALS


# --- Single-valued settings (they do not enlarge the grid) ---
K = [160]
# K = [80]
MAX_IT = [10]
DEFAULT_CONTEXT_1 = [True]

# --- Swept settings ---
L2 = [100, 1000, 10000, 100000]
V = [0, 0.5, 1]
ALPHA = [100, 1000, 10000, 100000]

# Alternative sweep kept for reference:
# L2 = [50000, 100000, 500000, 1000000]
# V = [0.75, 1]
# ALPHA = [5000, 10000, 20000, 50000]

# NOTE(review): the outputs saved in this notebook were produced with a
# different grid (k=[80], l2=[5000..50000], v=[0.75, 1], alpha=[500..5000],
# i.e. 32 combinations) than the values assigned here (48 combinations).
# Re-run the notebook to refresh them before relying on the reported scores.
HYPERPARAMS = dict(
    k=K,
    l2=L2,
    v=V,
    alpha=ALPHA,
    max_iterations=MAX_IT,
    default_context_1=DEFAULT_CONTEXT_1,
)
HYPERPARAMS

{'k': [80],
 'l2': [5000, 10000, 20000, 50000],
 'v': [0.75, 1],
 'alpha': [500, 1000, 2000, 5000],
 'max_iterations': [10],
 'default_context_1': [True]}

## Parse data

In [6]:
# Parse the interactions file, forwarding the configured ITEM_ID / USER_ID settings.
data = io.parse_interactions_with_context(
    INTERACTIONS,
    item_id=ITEM_ID,
    user_id=USER_ID,
)
# Display the `df` attribute of the parsed data as the cell's output.
data.df

Unnamed: 0,userId,itemId,daytime,weather,weekday
0,0,0,1,1,1
1,1,1,2,2,2
2,2,2,3,2,3
3,3,3,4,0,4
4,4,4,5,1,4
...,...,...,...,...,...
95997,109,0,3,1,1
95998,37,16,4,2,1
95999,180,33,2,2,1
96000,445,751,3,1,1


## Make train/val split for hyperparam tuning

In [7]:
# Seeded split used for hyperparameter tuning; `test` serves as the
# validation set that the grid search scores against.
train, test = evaluation.splits.context_leave_one_out_split(
    data,
    seed=SEED,
)

## Perform gridsearch on validation set

In [8]:
%%time
score, best_hyperparams = evaluation.cars.gridsearch(ALG, train, test, HYPERPARAMS, retarget=RETARGET)
f"Best score of {score} achieved with {best_hyperparams}."

  0%|          | 0/32 [00:00<?, ?it/s]

Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.272
MRR@20 0.292
Average Recall@5 0.449
Average Recall@20 0.642
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.247
MRR@20 0.268
Average Recall@5 0.384
Average Recall@20 0.572
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.201
MRR@20 0.22
Average Recall@5 0.311
Average Recall@20 0.5
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.128
MRR@20 0.145
Average Recall@5 0.241
Average Recall@20 0.402
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.277
MRR@20 0.299
Average Recall@5 0.453
Average Recall@20 0.652
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.269
MRR@20 0.29
Average Recall@5 0.441
Average Recall@20 0.64
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.247
MRR@20 0.267
Average Recall@5 0.381
Average Recall@20 0.571
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.198
MRR@20 0.216
Average Recall@5 0.312
Average Recall@20 0.493
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.272
MRR@20 0.295
Average Recall@5 0.449
Average Recall@20 0.654
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.265
MRR@20 0.287
Average Recall@5 0.42
Average Recall@20 0.629
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.224
MRR@20 0.246
Average Recall@5 0.342
Average Recall@20 0.547
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.126
MRR@20 0.143
Average Recall@5 0.26
Average Recall@20 0.439
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.278
MRR@20 0.3
Average Recall@5 0.464
Average Recall@20 0.667
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.275
MRR@20 0.296
Average Recall@5 0.457
Average Recall@20 0.652
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.262
MRR@20 0.286
Average Recall@5 0.401
Average Recall@20 0.621
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.206
MRR@20 0.226
Average Recall@5 0.325
Average Recall@20 0.511
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.266
MRR@20 0.291
Average Recall@5 0.461
Average Recall@20 0.679
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.269
MRR@20 0.292
Average Recall@5 0.451
Average Recall@20 0.659
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.24
MRR@20 0.263
Average Recall@5 0.38
Average Recall@20 0.598
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.17
MRR@20 0.19
Average Recall@5 0.284
Average Recall@20 0.473
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.28
MRR@20 0.303
Average Recall@5 0.477
Average Recall@20 0.683
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.267
MRR@20 0.29
Average Recall@5 0.463
Average Recall@20 0.681
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.269
MRR@20 0.292
Average Recall@5 0.434
Average Recall@20 0.651
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.227
MRR@20 0.248
Average Recall@5 0.354
Average Recall@20 0.551
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.259
MRR@20 0.285
Average Recall@5 0.461
Average Recall@20 0.694
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.267
MRR@20 0.293
Average Recall@5 0.456
Average Recall@20 0.695
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.245
MRR@20 0.27
Average Recall@5 0.42
Average Recall@20 0.656
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.173
MRR@20 0.196
Average Recall@5 0.306
Average Recall@20 0.532
Training model iTALS with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.264
MRR@20 0.29
Average Recall@5 0.464
Average Recall@20 0.697
Training model iTALS with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.265
MRR@20 0.29
Average Recall@5 0.462
Average Recall@20 0.691
Training model iTALS with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.256
MRR@20 0.282
Average Recall@5 0.436
Average Recall@20 0.679
Training model iTALS with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.237
MRR@20 0.259
Average Recall@5 0.398
Average Recall@20 0.612
CPU times: user 3min 24s, sys: 43.1 s, total: 4min 7s
Wall time: 10min 7s


"Best score of 0.3030041960752441 achieved with {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}."

## Evaluate the model with the optimal hyperparameters using K-fold cross-validation

In [9]:
%%time
alg = ALG(**best_hyperparams)
results = evaluation.cars.contextKFoldsEval(alg, data, nr_folds=5, seed=SEED2, retarget=RETARGET)

  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 816 users
MRR@5 0.28 (0.009)
MRR@20 0.301 (0.007)
Average Recall@5 0.461 (0.015)
Average Recall@20 0.652 (0.01)
CPU times: user 34.1 s, sys: 6.92 s, total: 41.1 s
Wall time: 1min 42s
