### Dataset: LastFM
### Algorithm: ItemKNN Incremental
### Padding unknown user/item: Random
### Flow: Library Flow

In [1]:
from streamsightv2.datasets.lastfm import LastFMDataset
from streamsightv2.settings import SlidingWindowSetting

# Cut-off shared by the split setting (top_K), the metrics and the model in
# the cells that follow.
k = 100

# Load the LastFM interactions.
dataset = LastFMDataset()
data = dataset.load()

# Sliding-window evaluation: interactions before `background_t` form the
# initial training data; each subsequent window spans 365 days.
setting_window = SlidingWindowSetting(
    background_t=1167550546,  # Unix timestamp in seconds (2006-12-31 UTC)
    window_size=365 * 24 * 60 * 60,  # 365 days, expressed in seconds
    top_K=k,
)
setting_window.split(data)

INFO - streamsight package loaded.
  from .autonotebook import tqdm as notebook_tqdm

DEBUG - LastFMDataset being initialized with 'data' as the base path.
DEBUG - LastFMDataset is initialized.
INFO - LastFMDataset is loading dataset...
DEBUG - Data zipfile is in memory and in dir specified.
DEBUG - LastFMDataset applying filters set.
DEBUG - 	interactions before preprocess: 186479
DEBUG - 	items before preprocess: 12523
DEBUG - 	users before preprocess: 1892
DEBUG - 	interactions after preprocess: 186479
DEBUG - 	items after preprocess: 12523
DEBUG - 	users after preprocess: 1892
INFO - LastFMDataset dataset loaded - Took 0.0898s
DEBUG - Splitting data...
DEBUG - Performing lt(t, 2147483647)
DEBUG - Performing lt(t, 1167550546)
DEBUG - Performing ge(t, 1167550546)
DEBUG - TimestampSplitter(t=1167550546,t_lower=None,t_upper=None) has complete split


  0%|          | 0/4 [00:00<?, ?it/s]

DEBUG - NPastInteractionTimestampSplitter(t=1167550546,t_lower=None,t_upper=31536000,n_seq_data=0,include_all_past_data=False) - Updating split point to t=1167550546
DEBUG - Performing lt(t, 1199086546)
DEBUG - Performing ge(t, 1167550546)
DEBUG - Performing get_user_n_last_interaction comparison
DEBUG - NPastInteractionTimestampSplitter(t=1167550546,t_lower=None,t_upper=31536000,n_seq_data=0,include_all_past_data=False) has complete split
INFO - Split at time 1167550546 resulted in empty unlabelled testing samples.
DEBUG - NPastInteractionTimestampSplitter(t=1167550546,t_lower=None,t_upper=31536000,n_seq_data=0,include_all_past_data=False) - Updating split point to t=1199086546
DEBUG - Performing lt(t, 1230622546)
DEBUG - Performing ge(t, 1199086546)
DEBUG - Performing get_user_n_last_interaction comparison
DEBUG - NPastInteractionTimestampSplitter(t=1199086546,t_lower=None,t_upper=31536000,n_seq_data=0,include_all_past_data=False) has complete split
INFO - Split at time 1199086546 re

5it [00:00, 45.87it/s]               

INFO - Finished split with window size 31536000 seconds. Number of splits: 5 in total.
INFO - SlidingWindowSetting data split - Took 0.135s
DEBUG - Checking split attribute and sizes.
DEBUG - Checking split attributes.
DEBUG - Split attributes are set.
DEBUG - Checking size of split sets.
DEBUG - Size of split sets are checked.
INFO - SlidingWindowSetting data split complete.





In [2]:
from streamsightv2.evaluators import EvaluatorStreamerBuilder

# Assemble the streaming evaluator: one sliding-window setting, metrics cut
# off at k.
builder = EvaluatorStreamerBuilder()
builder.add_setting(setting_window)
builder.set_metric_K(k)
# Metrics are registered in this order: precision, recall, NDCG.
for metric_name in ("PrecisionK", "RecallK", "NDCGK"):
    builder.add_metric(metric_name)
evaluator = builder.build()

In [3]:
from streamsightv2.algorithms import ItemKNNIncremental
# Model under test; pad_with_popularity=False corresponds to the "Random"
# padding named in the notebook header.
external_model = ItemKNNIncremental(K=k, pad_with_popularity=False)
# Only a name is registered with the evaluator; the model object itself is
# fitted and queried manually in the iteration cells below. The returned ID is
# used for every subsequent evaluator call.
external_model_id = evaluator.register_algorithm(algorithm_name="LastFM_ItemKNN_inc_RandomPad")
print(external_model_id)

INFO - Registering algorithm name LastFM_ItemKNN_inc_RandomPad with ID: bdd640fb-0667-4ad1-9c80-317fa3b1799d
DEBUG - Algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d registered
bdd640fb-0667-4ad1-9c80-317fa3b1799d


In [4]:
# Begin streaming: per the log output this resets the data generators and
# caches the evaluation data for step 1.
evaluator.start_stream()

DEBUG - Resetting data generators.
DEBUG - Data generators are reset.
DEBUG - Preparing evaluator for streaming
DEBUG - (user x item) shape defined is (187, 3034)
DEBUG - Shape of dataframe stored in matrix was (12302, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (12302, 5) after masking
DEBUG - Final (user x item) shape defined is (187, 3034)
DEBUG - Caching evaluation data for step 1
DEBUG - (user x item) shape defined is (187, 3034)
DEBUG - Shape of dataframe stored in matrix was (11440, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (11440, 5) after masking
DEBUG - Final (user x item) shape defined is (187, 3034)
DEBUG - (user x item) shape defined is (187, 3034)
DEBUG - Shape of dataframe stored in matrix was (11440, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (7817, 5) after masking
DEBUG - Final (user x item) shape defined is (457, 3034)
DEBUG - Data cached for step 1 complete


# Iteration 1

In [5]:
# Fetch the training interactions released for this step and fit the model.
# NOTE: this rebinds `data`, which held the full loaded dataset from the
# first cell.
data = evaluator.get_data(external_model_id)
external_model.fit(data)
# Display the training frame (columns: interactionid, uid, iid, ts, tagID).
data

DEBUG - Getting data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
Training data:  [[1 0 0 ... 0 0 0]
 [0 1 0 ... 0 0 0]
 [0 0 1 ... 0 0 0]
 ...
 [0 0 0 ... 0 0 0]
 [0 0 0 ... 0 0 0]
 [0 0 0 ... 0 0 0]]
Item similarities:  [[0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 ...
 [0. 0. 0. ... 0. 1. 0.]
 [0. 0. 0. ... 1. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]]
Item similarities after get_top_K_values:  [[0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 ...
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 1. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]]
  warn(f"{self.name} missing similar items for {missing} items.")

DEBUG - Fitting ItemKNNIncremental complete - Took 0.311s


       interactionid  uid   iid          ts  tagID
0                  0    0     0  -428720400     39
1                  1    1     1  -420771600    103
2                  2    1     1  -420771600  10021
3                  3    2     2  -405133200   1474
4                  4    3     3   294357600    311
...              ...  ...   ...         ...    ...
12297          12297    3  1970  1164927600    102
12298          12298    3  1791  1164927600     81
12299          12299   99  3033  1164927600  11934
12300          12300    3  1791  1164927600     33
12301          12301    3   183  1164927600    387

[12302 rows x 5 columns]

In [6]:
# Fetch the unlabeled frame for the upcoming window (iid is shown as -1 in
# the displayed output) and compute predictions from the fitted model.
ul_data = evaluator.get_unlabeled_data(external_model_id)
prediction = external_model.predict(data, ul_data)
# Display the unlabeled frame for inspection.
ul_data

DEBUG - Getting unlabeled data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
  warn(f"{self.name} missing similar items for {missing} items.")

DEBUG - Performing items_in comparison
In ItemKNNIncremental _predict:  [[0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 ...
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]]
Max user ID:  458
Max item ID:  0
X.shape:  (187, 3034)
Intended shape:  (458, 3034)
Predict frame:         interactionid  uid  iid          ts  tagID
12302          12302   24   -1  1167606000     76
12303          12303   60   -1  1167606000   1316
12304          12304   60   -1  1167606000   2664
12305          12305   76   -1  1167606000   1844
12306          12306    9   -1  1167606000   7263
...              ...  ...  ...         ...    ...
32693          32693  457   -1  1196463600   4397
32694          32694  457   -1  1196463600   1911
32695          32695  200   -1  1196463600    855
32700          32700  

       interactionid  uid  iid          ts  tagID
12302          12302   24   -1  1167606000     76
12303          12303   60   -1  1167606000   1316
12304          12304   60   -1  1167606000   2664
12305          12305   76   -1  1167606000   1844
12306          12306    9   -1  1167606000   7263
...              ...  ...  ...         ...    ...
32693          32693  457   -1  1196463600   4397
32694          32694  457   -1  1196463600   1911
32695          32695  200   -1  1196463600    855
32700          32700  315   -1  1196463600     81
32709          32709  457   -1  1196463600     79

[11440 rows x 5 columns]

In [7]:
# Summarise the prediction matrix via its sparse repr (dtype, stored-element
# count, shape, leading coordinates). A dense dump via `.toarray()` is
# deliberately avoided: it would allocate a full users x items float64 array
# only to print a truncated view.
print(prediction)
# Submit the predictions to the evaluator for this iteration.
evaluator.submit_prediction(external_model_id, prediction)

<Compressed Sparse Row sparse matrix of dtype 'float64'
	with 119052 stored elements and shape (458, 3034)>
  Coords	Values
  (0, 2910)	0.5773502691896258
  (0, 2896)	0.408248290463863
  (0, 2890)	0.5773502691896258
  (0, 2884)	0.5773502691896258
  (0, 2883)	0.408248290463863
  (0, 2880)	0.5773502691896258
  (0, 2879)	0.5773502691896258
  (0, 2878)	0.5773502691896258
  (0, 2877)	0.5773502691896258
  (0, 2871)	0.5773502691896258
  (0, 2865)	0.5773502691896258
  (0, 2861)	0.5773502691896258
  (0, 2856)	0.5773502691896258
  (0, 2854)	0.5773502691896258
  (0, 2853)	0.5773502691896258
  (0, 2851)	0.5773502691896258
  (0, 2849)	0.5773502691896258
  (0, 2842)	0.5773502691896258
  (0, 2835)	0.5773502691896258
  (0, 2834)	0.5773502691896258
  (0, 2832)	0.5773502691896258
  (0, 2825)	0.5773502691896258
  (0, 2821)	0.5773502691896258
  (0, 2815)	0.5773502691896258
  (0, 2814)	0.5773502691896258
  :	:
  (451, 2171)	1.0
  (451, 859)	1.0
  (451, 196)	1.0
  (451, 173)	1.0
  (452, 2300)	1.0
  (452, 22

# Iteration 2

In [8]:
# Fetch the training interactions released for this step and update the
# model. Per the log output, this call also caches evaluation data for step 2.
data = evaluator.get_data(external_model_id)
external_model.fit(data)
# Display the training frame (columns: interactionid, uid, iid, ts, tagID).
data

DEBUG - Getting data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
DEBUG - (user x item) shape defined is (458, 5278)
DEBUG - Shape of dataframe stored in matrix was (20415, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (20415, 5) after masking
DEBUG - Final (user x item) shape defined is (458, 5278)
DEBUG - Caching evaluation data for step 2
DEBUG - (user x item) shape defined is (458, 5278)
DEBUG - Shape of dataframe stored in matrix was (21359, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (21359, 5) after masking
DEBUG - Final (user x item) shape defined is (458, 5278)
DEBUG - (user x item) shape defined is (458, 5278)
DEBUG - Shape of dataframe stored in matrix was (21359, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (15787, 5) after masking
DEBUG - Final (user x item) shape defined is (918, 5278)
DEBUG - Data cached for step 2 complete
Training data:  [[1. 0. 0. ... 0. 0. 0.]
 [0. 1. 0. ... 0. 0. 0.]
 [0. 

       interactionid  uid   iid          ts  tagID
12302          12302   24  3034  1167606000     76
12303          12303   60  3035  1167606000   1316
12304          12304   60  3035  1167606000   2664
12305          12305   76  3036  1167606000   1844
12306          12306    9  1224  1167606000   7263
...              ...  ...   ...         ...    ...
32712          32712  340   512  1196463600    105
32713          32713  419  2309  1196463600     72
32714          32714  340   512  1196463600    570
32715          32715  131  5275  1196463600     47
32716          32716  131  5264  1196463600    187

[20415 rows x 5 columns]

In [9]:
# Fetch the unlabeled frame for the upcoming window (iid is shown as -1 in
# the displayed output) and compute predictions from the fitted model.
ul_data = evaluator.get_unlabeled_data(external_model_id)
prediction = external_model.predict(data, ul_data)
# Display the unlabeled frame for inspection.
ul_data

DEBUG - Getting unlabeled data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
  warn(f"{self.name} missing similar items for {missing} items.")

DEBUG - Performing items_in comparison
In ItemKNNIncremental _predict:  [[0.         0.         0.         ... 0.57735027 0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]
 ...
 [0.         0.         0.         ... 0.         0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]]
Max user ID:  918
Max item ID:  0
X.shape:  (458, 5278)
Intended shape:  (918, 5278)
Predict frame:         interactionid  uid  iid          ts  tagID
32717          32717  181   -1  1199142000   3364
32718          32718  419   -1  1199142000     78
32719          32719  419   -1  1199142000    169
32720          32720  398   -1  11

       interactionid  uid  iid          ts  tagID
32717          32717  181   -1  1199142000   3364
32718          32718  419   -1  1199142000     78
32719          32719  419   -1  1199142000    169
32720          32720  398   -1  1199142000     39
32721          32721  458   -1  1199142000     47
...              ...  ...  ...         ...    ...
72968          72968  780   -1  1228086000     25
72971          72971  862   -1  1228086000    515
72973          72973  823   -1  1228086000   7938
72974          72974   91   -1  1228086000   1835
72988          72988  460   -1  1228086000     83

[21359 rows x 5 columns]

In [10]:
# Summarise the prediction matrix via its sparse repr (dtype, stored-element
# count, shape, leading coordinates). A dense dump via `.toarray()` is
# deliberately avoided: it would allocate a full users x items float64 array
# only to print a truncated view.
print(prediction)
# Submit the predictions to the evaluator for this iteration.
evaluator.submit_prediction(external_model_id, prediction)

<Compressed Sparse Row sparse matrix of dtype 'float64'
	with 403175 stored elements and shape (918, 5278)>
  Coords	Values
  (0, 5275)	0.5773502691896258
  (0, 5270)	0.5773502691896258
  (0, 5269)	0.5773502691896258
  (0, 5265)	0.5773502691896258
  (0, 5264)	0.5773502691896258
  (0, 5258)	0.5773502691896258
  (0, 5254)	0.5773502691896258
  (0, 5252)	0.5773502691896258
  (0, 5249)	0.5773502691896258
  (0, 5246)	0.5773502691896258
  (0, 5201)	0.5773502691896258
  (0, 5199)	0.5773502691896258
  (0, 5196)	0.5773502691896258
  (0, 5195)	0.5773502691896258
  (0, 5194)	0.5773502691896258
  (0, 5193)	0.5773502691896258
  (0, 5168)	0.5773502691896258
  (0, 4965)	0.5773502691896258
  (0, 4885)	0.5773502691896258
  (0, 4862)	0.5773502691896258
  (0, 4780)	0.5773502691896258
  (0, 4779)	0.5773502691896258
  (0, 4771)	0.5773502691896258
  (0, 4755)	0.5773502691896258
  (0, 4649)	0.5773502691896258
  :	:
  (912, 3808)	1.0
  (912, 2667)	1.0
  (912, 2200)	1.0
  (912, 1685)	1.0
  (913, 5196)	1.0
  (91

# Iteration 3

In [11]:
# Fetch the training interactions released for this step and update the
# model. Per the log output, this call also caches evaluation data for step 3.
data = evaluator.get_data(external_model_id)
external_model.fit(data)
# Display the training frame (columns: interactionid, uid, iid, ts, tagID).
data

DEBUG - Getting data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
DEBUG - (user x item) shape defined is (918, 8205)
DEBUG - Shape of dataframe stored in matrix was (40273, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (40273, 5) after masking
DEBUG - Final (user x item) shape defined is (918, 8205)
DEBUG - Caching evaluation data for step 3
DEBUG - (user x item) shape defined is (918, 8205)
DEBUG - Shape of dataframe stored in matrix was (23605, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (23605, 5) after masking
DEBUG - Final (user x item) shape defined is (918, 8205)
DEBUG - (user x item) shape defined is (918, 8205)
DEBUG - Shape of dataframe stored in matrix was (23605, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (19148, 5) after masking
DEBUG - Final (user x item) shape defined is (1369, 8205)
DEBUG - Data cached for step 3 complete
Training data:  [[1. 0. 0. ... 0. 0. 0.]
 [0. 1. 0. ... 0. 0. 0.]
 [0.

       interactionid  uid   iid          ts  tagID
32717          32717  181  1332  1199142000   3364
32718          32718  419  5278  1199142000     78
32719          32719  419  5278  1199142000    169
32720          32720  398  1080  1199142000     39
32721          32721  458  5279  1199142000     47
...              ...  ...   ...         ...    ...
72985          72985  639   744  1228086000   8504
72986          72986  502  8204  1228086000    109
72987          72987  502  8200  1228086000    724
72988          72988  460  2139  1228086000     83
72989          72989  502  8200  1228086000    109

[40273 rows x 5 columns]

In [12]:
# Fetch the unlabeled frame for the upcoming window (iid is shown as -1 in
# the displayed output) and compute predictions from the fitted model.
ul_data = evaluator.get_unlabeled_data(external_model_id)
prediction = external_model.predict(data, ul_data)
# Display the unlabeled frame for inspection.
ul_data

DEBUG - Getting unlabeled data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
  warn(f"{self.name} missing similar items for {missing} items.")

DEBUG - Performing items_in comparison
In ItemKNNIncremental _predict:  [[0.         0.         0.         ... 0.         0.         0.        ]
 [0.         0.31622777 0.         ... 0.         0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]
 ...
 [0.         0.         0.         ... 0.         0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]
 [0.         0.         0.         ... 0.         0.         0.        ]]
Max user ID:  1369
Max item ID:  0
X.shape:  (918, 8205)
Intended shape:  (1369, 8205)
Predict frame:          interactionid   uid  iid          ts  tagID
72990           72990   918   -1  1230764400    176
72991           72991   412   -1  1230764400    275
72992           72992   918   -1  1230764400    227
72993           72993   

        interactionid   uid  iid          ts  tagID
72990           72990   918   -1  1230764400    176
72991           72991   412   -1  1230764400    275
72992           72992   918   -1  1230764400    227
72993           72993   460   -1  1230764400     15
72994           72994   196   -1  1230764400    187
...               ...   ...  ...         ...    ...
116338         116338   456   -1  1259622000    693
116341         116341   207   -1  1259622000    387
116347         116347   207   -1  1259622000    191
116348         116348  1339   -1  1259622000   4228
116351         116351   456   -1  1259622000    432

[23605 rows x 5 columns]

In [13]:
# Summarise the prediction matrix via its sparse repr (dtype, stored-element
# count, shape, leading coordinates). A dense dump via `.toarray()` is
# deliberately avoided: it would allocate a full users x items float64 array
# only to print a truncated view.
print(prediction)
# Submit the predictions to the evaluator for this iteration.
evaluator.submit_prediction(external_model_id, prediction)

<Compressed Sparse Row sparse matrix of dtype 'float64'
	with 937604 stored elements and shape (1369, 8205)>
  Coords	Values
  (0, 8068)	0.5
  (0, 8014)	0.5
  (0, 7772)	0.5
  (0, 7763)	0.35355339059327373
  (0, 7678)	0.35355339059327373
  (0, 7637)	0.5
  (0, 7406)	0.5
  (0, 7401)	0.5
  (0, 7399)	0.5
  (0, 7396)	0.5
  (0, 7365)	0.5
  (0, 7350)	0.5
  (0, 7349)	0.5
  (0, 7271)	0.5
  (0, 6654)	0.35355339059327373
  (0, 6574)	0.5
  (0, 6304)	0.35355339059327373
  (0, 6133)	0.35355339059327373
  (0, 6082)	0.35355339059327373
  (0, 5384)	0.5
  (0, 5265)	0.5
  (0, 5246)	0.35355339059327373
  (0, 5199)	0.5
  (0, 5196)	0.5
  (0, 5195)	0.35355339059327373
  :	:
  (1365, 2811)	1.0
  (1365, 2683)	1.0
  (1365, 413)	1.0
  (1366, 7679)	1.0
  (1366, 7528)	1.0
  (1366, 7497)	1.0
  (1366, 7463)	1.0
  (1366, 6589)	1.0
  (1366, 6405)	1.0
  (1366, 5319)	1.0
  (1366, 4602)	1.0
  (1366, 3660)	1.0
  (1366, 3632)	1.0
  (1366, 3314)	1.0
  (1366, 3001)	1.0
  (1366, 2429)	1.0
  (1366, 2239)	1.0
  (1366, 2236)	1.0


# Iteration 4

In [14]:
# Fetch the training interactions released for this step and update the
# model. Per the log output, this call also caches evaluation data for step 4.
data = evaluator.get_data(external_model_id)
external_model.fit(data)
# Display the training frame (columns: interactionid, uid, iid, ts, tagID).
data

DEBUG - Getting data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
DEBUG - (user x item) shape defined is (1369, 10380)
DEBUG - Shape of dataframe stored in matrix was (43366, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (43366, 5) after masking
DEBUG - Final (user x item) shape defined is (1369, 10380)
DEBUG - Caching evaluation data for step 4
DEBUG - (user x item) shape defined is (1369, 10380)
DEBUG - Shape of dataframe stored in matrix was (27243, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (27243, 5) after masking
DEBUG - Final (user x item) shape defined is (1369, 10380)
DEBUG - (user x item) shape defined is (1369, 10380)
DEBUG - Shape of dataframe stored in matrix was (27243, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (23382, 5) after masking
DEBUG - Final (user x item) shape defined is (1821, 10380)
DEBUG - Data cached for step 4 complete
Training data:  [[1. 0. 0. ... 0. 0. 0.]
 [0. 1. 0. ... 0. 

        interactionid   uid   iid          ts  tagID
72990           72990   918  2027  1230764400    176
72991           72991   412  1223  1230764400    275
72992           72992   918  5332  1230764400    227
72993           72993   460  2144  1230764400     15
72994           72994   196  1446  1230764400    187
...               ...   ...   ...         ...    ...
116351         116351   456  1306  1259622000    432
116352         116352   739   376  1259622000     16
116353         116353  1301  1095  1259622000    847
116354         116354  1115   736  1259622000    134
116355         116355   428  3980  1259622000   8304

[43366 rows x 5 columns]

In [15]:
# Fetch the unlabeled frame for the upcoming window (iid is shown as -1 in
# the displayed output) and compute predictions from the fitted model.
ul_data = evaluator.get_unlabeled_data(external_model_id)
prediction = external_model.predict(data, ul_data)
# Display the unlabeled frame for inspection.
ul_data

DEBUG - Getting unlabeled data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
  warn(f"{self.name} missing similar items for {missing} items.")

DEBUG - Performing items_in comparison
In ItemKNNIncremental _predict:  [[0. 0. 0. ... 0. 0. 0.]
 [0. 1. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 ...
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]
 [0. 0. 0. ... 0. 0. 0.]]
Max user ID:  1821
Max item ID:  0
X.shape:  (1369, 10380)
Intended shape:  (1821, 10380)
Predict frame:          interactionid   uid  iid          ts  tagID
116356         116356   220   -1  1262300400    386
116357         116357   220   -1  1262300400    387
116358         116358   220   -1  1262300400    147
116359         116359   220   -1  1262300400    386
116360         116360   220   -1  1262300400     72
...               ...   ...  ...         ...    ...
171349         171349  1815   -1  1291158000     73
171350         171350  1815   -1  1291158000     81
171351         171351  1801   -1  1291158000    2

        interactionid   uid  iid          ts  tagID
116356         116356   220   -1  1262300400    386
116357         116357   220   -1  1262300400    387
116358         116358   220   -1  1262300400    147
116359         116359   220   -1  1262300400    386
116360         116360   220   -1  1262300400     72
...               ...   ...  ...         ...    ...
171349         171349  1815   -1  1291158000     73
171350         171350  1815   -1  1291158000     81
171351         171351  1801   -1  1291158000    275
171352         171352  1815   -1  1291158000    134
171353         171353  1698   -1  1291158000     16

[27243 rows x 5 columns]

In [16]:
# Summarise the prediction matrix via its sparse repr (dtype, stored-element
# count, shape, leading coordinates). A dense dump via `.toarray()` is
# deliberately avoided: it would allocate a full users x items float64 array
# only to print a truncated view.
print(prediction)
# Submit the predictions to the evaluator for this iteration.
evaluator.submit_prediction(external_model_id, prediction)

<Compressed Sparse Row sparse matrix of dtype 'float64'
	with 1554342 stored elements and shape (1821, 10380)>
  Coords	Values
  (0, 9542)	0.5
  (0, 9537)	0.35355339059327373
  (0, 9536)	0.5
  (0, 9336)	0.5
  (0, 9288)	0.5
  (0, 9076)	0.35355339059327373
  (0, 8460)	0.35355339059327373
  (0, 8427)	0.5
  (0, 8372)	0.5
  (0, 8014)	0.5
  (0, 7772)	0.35355339059327373
  (0, 7763)	0.35355339059327373
  (0, 7406)	0.5
  (0, 7401)	0.35355339059327373
  (0, 7399)	0.35355339059327373
  (0, 7396)	0.35355339059327373
  (0, 7365)	0.35355339059327373
  (0, 7349)	0.35355339059327373
  (0, 7271)	0.35355339059327373
  (0, 7033)	0.35355339059327373
  (0, 6574)	0.35355339059327373
  (0, 6304)	0.35355339059327373
  (0, 6158)	0.4082482904638631
  (0, 6082)	0.35355339059327373
  (0, 6031)	0.35355339059327373
  :	:
  (1816, 9590)	1.0
  (1816, 9392)	1.0
  (1816, 8176)	1.0
  (1816, 7484)	1.0
  (1816, 6477)	1.0
  (1816, 5159)	1.0
  (1816, 4231)	1.0
  (1816, 3940)	1.0
  (1816, 3316)	1.0
  (1816, 1456)	1.0
  (181

# Iteration 5

In [17]:
# Fetch the training interactions released for this step and update the
# model. Per the log output, this call also caches evaluation data for step 5.
data = evaluator.get_data(external_model_id)
external_model.fit(data)
# Display the training frame (columns: interactionid, uid, iid, ts, tagID).
data

DEBUG - Getting data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
DEBUG - (user x item) shape defined is (1821, 12146)
DEBUG - Shape of dataframe stored in matrix was (54998, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (54998, 5) after masking
DEBUG - Final (user x item) shape defined is (1821, 12146)
DEBUG - Caching evaluation data for step 5
DEBUG - (user x item) shape defined is (1821, 12146)
DEBUG - Shape of dataframe stored in matrix was (10224, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (10224, 5) after masking
DEBUG - Final (user x item) shape defined is (1821, 12146)
DEBUG - (user x item) shape defined is (1821, 12146)
DEBUG - Shape of dataframe stored in matrix was (10224, 5) before masking
DEBUG - Shape of dataframe stored in matrix is now (9342, 5) after masking
DEBUG - Final (user x item) shape defined is (1890, 12146)
DEBUG - Data cached for step 5 complete
Training data:  [[2. 0. 0. ... 0. 0. 0.]
 [0. 1. 0. ... 0. 0

        interactionid   uid    iid          ts  tagID
116356         116356   220   1473  1262300400    386
116357         116357   220    528  1262300400    387
116358         116358   220   1554  1262300400    147
116359         116359   220   2352  1262300400    386
116360         116360   220  10380  1262300400     72
...               ...   ...    ...         ...    ...
171349         171349  1815  10021  1291158000     73
171350         171350  1815  10021  1291158000     81
171351         171351  1801     30  1291158000    275
171352         171352  1815  10021  1291158000    134
171353         171353  1698    202  1291158000     16

[54998 rows x 5 columns]

In [18]:
# Fetch the unlabeled frame for the upcoming window (iid is shown as -1 in
# the displayed output) and compute predictions from the fitted model.
ul_data = evaluator.get_unlabeled_data(external_model_id)
prediction = external_model.predict(data, ul_data)
# Display the unlabeled frame for inspection.
ul_data

DEBUG - Getting unlabeled data for algorithm bdd640fb-0667-4ad1-9c80-317fa3b1799d
  warn(f"{self.name} missing similar items for {missing} items.")

DEBUG - Performing items_in comparison
In ItemKNNIncremental _predict:  [[41.15391353  0.          0.         ...  1.08648127  0.30151134
   0.        ]
 [ 0.30588765 11.28697563  0.         ...  0.          0.
   0.        ]
 [ 0.          0.          0.90906006 ...  0.          0.30151134
   0.        ]
 ...
 [ 0.          0.          0.         ...  0.          0.
   0.        ]
 [ 0.          0.          0.         ...  0.          0.
   0.        ]
 [ 0.          0.          0.         ...  0.          0.
   0.        ]]
Max user ID:  1892
Max item ID:  0
X.shape:  (1821, 12146)
Intended shape:  (1892, 12146)
Predict frame:          interactionid   uid  iid          ts  tagID
171354         171354   853   -1  1293836400     24
171355         171355   853   -1  1293836400    130
171356         171356  1801   -1  1293836400    275
17135

        interactionid   uid  iid          ts  tagID
171354         171354   853   -1  1293836400     24
171355         171355   853   -1  1293836400    130
171356         171356  1801   -1  1293836400    275
171357         171357  1186   -1  1293836400    424
171358         171358  1404   -1  1293836400     39
...               ...   ...  ...         ...    ...
186445         186445  1237   -1  1304940155    389
186446         186446  1237   -1  1304940165     80
186447         186447  1237   -1  1304940174    481
186448         186448  1237   -1  1304940176    121
186449         186449  1237   -1  1304940176    121

[10224 rows x 5 columns]

In [19]:
# Summarise the prediction matrix via its sparse repr (dtype, stored-element
# count, shape, leading coordinates). A dense dump via `.toarray()` is
# deliberately avoided: it would allocate a full users x items float64 array
# only to print a truncated view.
print(prediction)
# Submit the predictions to the evaluator for this iteration.
evaluator.submit_prediction(external_model_id, prediction)

<Compressed Sparse Row sparse matrix of dtype 'float64'
	with 2162951 stored elements and shape (1892, 12146)>
  Coords	Values
  (0, 12056)	150.64822738115694
  (0, 12055)	150.40854166667353
  (0, 12054)	151.3551796143842
  (0, 12049)	149.52072762357062
  (0, 12044)	149.8761468138766
  (0, 11957)	47.87943391945251
  (0, 11952)	153.43253675569977
  (0, 11951)	151.78904498183692
  (0, 11950)	151.61718957424003
  (0, 11949)	153.13224848365044
  (0, 11948)	151.38437326470594
  (0, 11946)	152.3020555773516
  (0, 11945)	151.26236933063365
  (0, 11944)	149.9755479423636
  (0, 11937)	53.077831408434086
  (0, 11933)	149.37641238555042
  (0, 11931)	150.6026629433513
  (0, 11930)	150.02020614110208
  (0, 11929)	150.3178601774092
  (0, 11927)	150.24513801405766
  (0, 11926)	44.440097578106446
  (0, 11925)	150.01224358137415
  (0, 11924)	150.6739892951444
  (0, 11923)	151.55413437975747
  (0, 11922)	50.63465358969
  :	:
  (1887, 1651)	1.0
  (1887, 1211)	1.0
  (1887, 516)	1.0
  (1887, 101)	1.0
  (18

# Evaluate metrics

In [20]:
# Check the state of every registered algorithm; the single algorithm here is
# reported as COMPLETED after the five iterations above.
evaluator.get_all_algorithm_status()

{'LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d': <AlgorithmStateEnum.COMPLETED: 'COMPLETED'>}

In [21]:
# Macro view: one `macro_score` per metric, reported alongside the number of
# windows (`num_window`).
evaluator.metric_results("macro")

Unnamed: 0_level_0,Unnamed: 1_level_0,macro_score,num_window
Algorithm,Metric,Unnamed: 2_level_1,Unnamed: 3_level_1
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,NDCGK_100,0.067357,5
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,PrecisionK_100,0.012304,5
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,RecallK_100,0.142795,5


In [22]:
# Micro view: one `micro_score` per metric, reported alongside the number of
# users (`num_user`).
evaluator.metric_results("micro")


Unnamed: 0_level_0,Unnamed: 1_level_0,micro_score,num_user
Algorithm,Metric,Unnamed: 2_level_1,Unnamed: 3_level_1
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,NDCGK_100,0.066827,3282
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,PrecisionK_100,0.012322,3282
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,RecallK_100,0.141486,3282


In [23]:
# User view: one `score` row per (timestamp, metric, user_id).
evaluator.metric_results("user")

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,user_id,score
Algorithm,Timestamp,Metric,Unnamed: 3_level_1,Unnamed: 4_level_1
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,PrecisionK_100,3,0.0
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,PrecisionK_100,4,0.02
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,PrecisionK_100,8,0.0
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,PrecisionK_100,9,0.13
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,PrecisionK_100,12,0.0
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,...,...,...,...
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1293694546,NDCGK_100,1885,0.0
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1293694546,NDCGK_100,1886,0.0
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1293694546,NDCGK_100,1887,0.0
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1293694546,NDCGK_100,1888,0.0


In [24]:
# Window view: one `window_score` per (timestamp, metric), with the number of
# users evaluated in that window (`num_user`).
evaluator.metric_results("window")

Unnamed: 0_level_0,Unnamed: 1_level_0,Unnamed: 2_level_0,window_score,num_user
Algorithm,Timestamp,Metric,Unnamed: 3_level_1,Unnamed: 4_level_1
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,PrecisionK_100,0.010787,356
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,RecallK_100,0.091245,356
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1167550546,NDCGK_100,0.048881,356
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1199086546,PrecisionK_100,0.011216,658
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1199086546,RecallK_100,0.093765,658
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1199086546,NDCGK_100,0.05187,658
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1230622546,PrecisionK_100,0.012211,805
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1230622546,RecallK_100,0.129347,805
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1230622546,NDCGK_100,0.060363,805
LastFM_ItemKNN_inc_RandomPad_bdd640fb-0667-4ad1-9c80-317fa3b1799d,t=1262158546,PrecisionK_100,0.012231,937
