In [1]:
# Enable IPython's autoreload extension; mode 2 re-imports all modules before
# each cell runs, so edits to the local `src` package are picked up without a
# kernel restart.
%load_ext autoreload
%autoreload 2

# Experiments with WMF model

In [2]:
from pathlib import Path

import scipy.sparse
import numpy as np

import src.io as io
import src.evaluation as evaluation
import src.evaluation.splits
import src.evaluation.base

from src.algorithm.baseline.wmf import WMF

## Datasets

In [3]:
## Select the dataset by name via DATASET below.
## Each entry pairs the data directory with its RETARGET flag, so the two
## settings are always changed together.
## RETARGET True for Frappe, False for the others
DATASETS = {
    'Mobile_Frappe': (Path('../../../data/CARS/Mobile_Frappe/'), True),
    'Food_com': (Path('../../../data/CARS/Food_com/'), False),
    'TripAdvisor': (Path('../../../data/CARS/TripAdvisor/'), False),
}

## One of the keys of DATASETS; an unknown name raises KeyError right here.
DATASET = 'Food_com'

DATA_DIR, RETARGET = DATASETS[DATASET]

In [4]:
# Fixed settings -- these normally stay the same between experiments.

# Names passed as `user_id` / `item_id` when the interactions are parsed.
USER_ID = 'user'
ITEM_ID = 'item'

# SEED is used for the train/validation split, SEED2 for the k-fold evaluation.
SEED = 123456
SEED2 = 78910

# Interactions file inside the selected dataset directory.
INTERACTIONS = DATA_DIR.joinpath('interactions.csv')

## Define algorithm and hyperparameter ranges

In [5]:
# Algorithm class handed to the grid search and instantiated for the final evaluation.
ALG = WMF

# Single-valued settings.
K = [80]
MAX_IT = [10]

# Multi-valued settings.
# (Alternative, coarser grid kept for reference:
#  L2 and ALPHA in [100, 1000, 10000, 100000], V in [0, 0.5, 1].)
L2 = [500, 1000, 1500, 2000, 5000]
V = [0, 0.25]
ALPHA = [1, 20, 50, 100, 200, 500]

# Maps each WMF keyword argument to its list of candidate values.
HYPERPARAMS = dict(k=K, l2=L2, v=V, alpha=ALPHA, max_iterations=MAX_IT)

# Echo the grid as the cell output.
HYPERPARAMS

{'k': [80],
 'l2': [500, 1000, 1500, 2000, 5000],
 'v': [0, 0.25],
 'alpha': [1, 20, 50, 100, 200, 500],
 'max_iterations': [10]}

## Parse data

In [6]:
# Parse the interactions file, passing the configured item and user identifiers.
data = io.parse_interactions_with_context(
    INTERACTIONS,
    item_id=ITEM_ID,
    user_id=USER_ID,
)

# Show `data.df` as the cell output.
data.df

Unnamed: 0,userId,itemId,season,weekday
0,19211,6280,1,1
1,17684,6280,2,2
2,12110,6280,3,3
3,7184,6280,3,1
4,17837,6280,2,4
...,...,...,...,...
388357,895,7799,3,7
388358,4100,7799,4,2
388359,2940,7799,1,4
388360,757,7799,2,2


## Make train/validation split for hyperparameter tuning

In [7]:
# Seeded leave-one-out split: a training part plus validation input/output parts.
Xtrain, Xval_in, Xval_out = evaluation.splits.leave_one_out_split_non_context(
    data,
    seed=SEED,
)

## Perform grid search on validation set

In [8]:
%%time
score, best_hyperparams = evaluation.base.gridsearch(ALG, Xtrain, Xval_in, Xval_out, HYPERPARAMS, retarget=RETARGET)
f"Best score of {score} achieved with {best_hyperparams}."

  0%|          | 0/60 [00:00<?, ?it/s]

Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.25, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0.25, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.25, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.25, 'alpha': 1, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.054
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.013
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.25, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.013
Average Recall@5 0.021
Average Recall@20 0.054
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0.25, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.018
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.25, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.018
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.25, 'alpha': 20, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.018
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.014
MRR@20 0.018
Average Recall@5 0.026
Average Recall@20 0.062
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.02
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.25, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.014
MRR@20 0.017
Average Recall@5 0.025
Average Recall@20 0.063
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0.25, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.25, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.25, 'alpha': 50, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.009
MRR@20 0.012
Average Recall@5 0.018
Average Recall@20 0.053
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.014
MRR@20 0.017
Average Recall@5 0.024
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.014
MRR@20 0.017
Average Recall@5 0.026
Average Recall@20 0.062
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.015
Average Recall@5 0.022
Average Recall@20 0.057
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.25, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.015
MRR@20 0.018
Average Recall@5 0.025
Average Recall@20 0.058
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.013
MRR@20 0.017
Average Recall@5 0.025
Average Recall@20 0.062
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0.25, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.015
Average Recall@5 0.022
Average Recall@20 0.058
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.25, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.25, 'alpha': 100, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.013
Average Recall@5 0.021
Average Recall@20 0.054
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.012
MRR@20 0.015
Average Recall@5 0.02
Average Recall@20 0.049
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.015
MRR@20 0.018
Average Recall@5 0.026
Average Recall@20 0.062
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.016
MRR@20 0.019
Average Recall@5 0.028
Average Recall@20 0.065
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.012
MRR@20 0.016
Average Recall@5 0.022
Average Recall@20 0.058
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.25, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.013
MRR@20 0.015
Average Recall@5 0.022
Average Recall@20 0.049
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.016
MRR@20 0.019
Average Recall@5 0.027
Average Recall@20 0.065
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0.25, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.015
MRR@20 0.018
Average Recall@5 0.027
Average Recall@20 0.064
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.25, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.015
Average Recall@5 0.022
Average Recall@20 0.057
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.25, 'alpha': 200, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.014
Average Recall@5 0.019
Average Recall@20 0.056
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.01
MRR@20 0.013
Average Recall@5 0.018
Average Recall@20 0.044
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.012
MRR@20 0.015
Average Recall@5 0.02
Average Recall@20 0.051
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.014
MRR@20 0.017
Average Recall@5 0.024
Average Recall@20 0.057
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.016
MRR@20 0.019
Average Recall@5 0.027
Average Recall@20 0.063
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.021
Average Recall@20 0.057
Training model WMF with hyperparameters {'k': 80, 'l2': 500, 'v': 0.25, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.013
Average Recall@5 0.018
Average Recall@20 0.044
Training model WMF with hyperparameters {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.013
MRR@20 0.016
Average Recall@5 0.022
Average Recall@20 0.054
Training model WMF with hyperparameters {'k': 80, 'l2': 1500, 'v': 0.25, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.013
MRR@20 0.017
Average Recall@5 0.024
Average Recall@20 0.059
Training model WMF with hyperparameters {'k': 80, 'l2': 2000, 'v': 0.25, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.015
MRR@20 0.019
Average Recall@5 0.027
Average Recall@20 0.066
Training model WMF with hyperparameters {'k': 80, 'l2': 5000, 'v': 0.25, 'alpha': 500, 'max_iterations': 10}


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.011
MRR@20 0.014
Average Recall@5 0.022
Average Recall@20 0.057
CPU times: user 36min 28s, sys: 5min 36s, total: 42min 5s
Wall time: 1h 5min 39s


"Best score of 0.019411480887727674 achieved with {'k': 80, 'l2': 1000, 'v': 0.25, 'alpha': 200, 'max_iterations': 10}."

## Evaluate the model with the optimal hyperparameters using k-fold cross-validation

In [9]:
%%time
alg = ALG(**best_hyperparams)
results = evaluation.base.kFoldsEval(alg, data, nr_folds=5, seed=SEED2, retarget=RETARGET)

  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users


  0%|          | 0/10 [00:00<?, ?it/s]

Evaluating with 22178 users
MRR@5 0.015 (0.0)
MRR@20 0.019 (0.0)
Average Recall@5 0.026 (0.001)
Average Recall@20 0.063 (0.001)
CPU times: user 3min 12s, sys: 27.8 s, total: 3min 39s
Wall time: 5min 40s
