In [1]:
# Enable IPython's autoreload extension in mode 2 so that edits to the imported
# project modules are picked up live, without restarting the kernel.
%load_ext autoreload
%autoreload 2

# Experiments with the iTALSs model

In [2]:
from pathlib import Path

import src.io as io
import src.evaluation as evaluation
import src.evaluation.splits
import src.evaluation.cars

from src.algorithm.cars.itals import iTALSs

## Datasets

In [3]:
## Pick the dataset by name via DATASET; its directory and RETARGET flag are
## looked up together, so the two can no longer get out of sync.
## RETARGET is True for Frappe, False for the others.
DATASETS = {
    'Mobile_Frappe': True,
    'Food_com': False,
    'TripAdvisor': False,
}
DATASET = 'TripAdvisor'

# An unknown DATASET name fails here with a KeyError instead of silently
# pointing at a directory with the wrong RETARGET setting.
RETARGET = DATASETS[DATASET]
DATA_DIR = Path('../../../data/CARS') / DATASET

In [4]:
# Fixed experiment settings; these shouldn't need to change between datasets.

# Identifier names handed to the interaction parser as user_id / item_id.
USER_ID = 'user'
ITEM_ID = 'item'

# Two independent seeds: SEED for the tuning split, SEED2 for the K-fold evaluation.
SEED, SEED2 = 123456, 78910

# Interaction file inside the selected dataset directory.
INTERACTIONS = DATA_DIR.joinpath('interactions.csv')

## Define algorithm and hyperparameter ranges

In [5]:
# Algorithm class under test; it is instantiated with each hyperparameter combination.
ALG = iTALSs

# Hyperparameters with a single candidate value.
K = [80]
MAX_IT = [10]
DEFAULT_CONTEXT_1 = [True]

# Alternative, coarser grid (disabled):
#   L2 = [100, 1000, 10000, 100000]
#   V = [0, 0.5, 1]
#   ALPHA = [100, 1000, 10000, 100000]

# Grid that is actually searched: 5 x 2 x 5 = 50 combinations.
L2 = [5000, 10000, 15000, 20000, 50000]
V = [0.75, 1]
ALPHA = [500, 1000, 1500, 2000, 5000]

# Keyword name -> list of candidate values; key order is kept as k, l2, v, alpha,
# max_iterations, default_context_1.
HYPERPARAMS = dict(
    k=K,
    l2=L2,
    v=V,
    alpha=ALPHA,
    max_iterations=MAX_IT,
    default_context_1=DEFAULT_CONTEXT_1,
)
HYPERPARAMS

{'k': [80],
 'l2': [5000, 10000, 15000, 20000, 50000],
 'v': [0.75, 1],
 'alpha': [500, 1000, 1500, 2000, 5000],
 'max_iterations': [10],
 'default_context_1': [True]}

## Parse data

In [6]:
# Read the interaction file; ITEM_ID / USER_ID are forwarded as the parser's
# item_id / user_id arguments.
data = io.parse_interactions_with_context(
    INTERACTIONS,
    item_id=ITEM_ID,
    user_id=USER_ID,
)
# Show the parsed frame as the cell output.
data.df

Unnamed: 0,userId,itemId,TripType,UserState
0,1899,1865,1,1
1,466,721,1,1
2,1992,451,2,1
3,466,1016,1,1
4,1441,414,3,1
...,...,...,...,...
12831,936,341,3,78
12832,1545,1936,3,78
12833,399,1556,2,79
12834,918,1380,5,79


## Make train/val split for hyperparam tuning

In [7]:
# Seeded split of the parsed data. NOTE: `test` is the held-out part that the
# grid search below scores against, i.e. it serves as the validation set.
train, test = evaluation.splits.context_leave_one_out_split(
    data,
    seed=SEED,
)

## Perform grid search on the validation set

In [8]:
%%time
score, best_hyperparams = evaluation.cars.gridsearch(ALG, train, test, HYPERPARAMS, retarget=RETARGET)
f"Best score of {score} achieved with {best_hyperparams}."

  0%|          | 0/50 [00:00<?, ?it/s]

Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.044
Average Recall@20 0.11
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.067
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.023
MRR@20 0.029
Average Recall@5 0.043
Average Recall@20 0.103
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.009
MRR@20 0.014
Average Recall@5 0.015
Average Recall@20 0.072
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.022
MRR@20 0.027
Average Recall@5 0.039
Average Recall@20 0.097
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.025
MRR@20 0.031
Average Recall@5 0.046
Average Recall@20 0.108
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.009
MRR@20 0.014
Average Recall@5 0.015
Average Recall@20 0.072
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.021
MRR@20 0.025
Average Recall@5 0.039
Average Recall@20 0.08
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.046
Average Recall@20 0.108
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.018
MRR@20 0.023
Average Recall@5 0.033
Average Recall@20 0.089
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.009
MRR@20 0.014
Average Recall@5 0.015
Average Recall@20 0.073
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.02
MRR@20 0.024
Average Recall@5 0.035
Average Recall@20 0.08
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.023
MRR@20 0.03
Average Recall@5 0.041
Average Recall@20 0.109
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 0.75, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.045
Average Recall@20 0.108
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.009
MRR@20 0.015
Average Recall@5 0.017
Average Recall@20 0.074
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.019
MRR@20 0.023
Average Recall@5 0.032
Average Recall@20 0.078
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.022
MRR@20 0.027
Average Recall@5 0.039
Average Recall@20 0.095
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 1, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.046
Average Recall@20 0.11
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.021
MRR@20 0.027
Average Recall@5 0.039
Average Recall@20 0.106
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 1500, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.018
MRR@20 0.022
Average Recall@5 0.032
Average Recall@20 0.081
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.021
MRR@20 0.027
Average Recall@5 0.039
Average Recall@20 0.097
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.044
Average Recall@20 0.106
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.017
MRR@20 0.023
Average Recall@5 0.033
Average Recall@20 0.097
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.015
Average Recall@5 0.018
Average Recall@20 0.064
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.017
MRR@20 0.021
Average Recall@5 0.03
Average Recall@20 0.073
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.022
MRR@20 0.027
Average Recall@5 0.039
Average Recall@20 0.093
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.023
MRR@20 0.029
Average Recall@5 0.041
Average Recall@20 0.105
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.024
MRR@20 0.03
Average Recall@5 0.045
Average Recall@20 0.111
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 2000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.018
Average Recall@20 0.063
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.016
MRR@20 0.02
Average Recall@5 0.031
Average Recall@20 0.072
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.017
MRR@20 0.022
Average Recall@5 0.034
Average Recall@20 0.081
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.021
MRR@20 0.026
Average Recall@5 0.036
Average Recall@20 0.093
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.023
MRR@20 0.028
Average Recall@5 0.041
Average Recall@20 0.101
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 0.75, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.012
MRR@20 0.017
Average Recall@5 0.019
Average Recall@20 0.078
Training model iTALSs with hyperparameters {'k': 80, 'l2': 5000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.015
MRR@20 0.019
Average Recall@5 0.028
Average Recall@20 0.071
Training model iTALSs with hyperparameters {'k': 80, 'l2': 10000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.018
MRR@20 0.022
Average Recall@5 0.032
Average Recall@20 0.081
Training model iTALSs with hyperparameters {'k': 80, 'l2': 15000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.02
MRR@20 0.024
Average Recall@5 0.037
Average Recall@20 0.084
Training model iTALSs with hyperparameters {'k': 80, 'l2': 20000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.022
MRR@20 0.027
Average Recall@5 0.039
Average Recall@20 0.092
Training model iTALSs with hyperparameters {'k': 80, 'l2': 50000, 'v': 1, 'alpha': 5000, 'max_iterations': 10, 'default_context_1': True}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.023
MRR@20 0.03
Average Recall@5 0.046
Average Recall@20 0.112
CPU times: user 9min 27s, sys: 2min 9s, total: 11min 37s
Wall time: 18min 57s


"Best score of 0.03080935839706022 achieved with {'k': 80, 'l2': 10000, 'v': 0.75, 'alpha': 1000, 'max_iterations': 10, 'default_context_1': True}."

## Evaluate the model with the optimal hyperparameters using K-fold cross-validation

In [9]:
%%time
alg = ALG(**best_hyperparams)
results = evaluation.cars.contextKFoldsEval(alg, data, nr_folds=5, seed=SEED2, retarget=RETARGET)

  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 2362 users
MRR@5 0.023 (0.002)
MRR@20 0.029 (0.001)
Average Recall@5 0.041 (0.003)
Average Recall@20 0.104 (0.001)
CPU times: user 57.3 s, sys: 13 s, total: 1min 10s
Wall time: 1min 56s
