In [1]:
import pandas as pd
import numpy as np
import os

# Ablation study

In [2]:
# Metric columns shown in every results table; later cells reuse this tuple.
metrics = ("test_ndcg@10", "test_recall@10", "used_epochs")

# One entry per ablation study:
# (CSV file name inside "results", hyperparameter column to show first).
ablation_study_files = [
    ("layer_size_results.csv", "hidden_layer_size"),
    ("masking_ratio_results.csv", "mask_probability"),
    ("max_sequence_length_results.csv", "max_sequence_length"),
    ("num_layers_results.csv", "num_hidden_layers"),
    ("sequence_length_results.csv", "pad_length"),
]

# Print one LaTeX table per study: the hyperparameter column followed by the
# metric columns, without the DataFrame index and with LaTeX special
# characters escaped.
# NOTE(review): the max_sequence_length table is printed with float values and
# a NaN row -- confirm that this is the intended presentation for that study.
for csv_name, swept_column in ablation_study_files:
    csv_path = os.path.join("results", csv_name)
    table_columns = [swept_column] + list(metrics)
    df = pd.read_csv(csv_path).loc[:, table_columns]
    print(df.to_latex(index=False, escape=True))

\begin{tabular}{rrrr}
\toprule
hidden\_layer\_size & test\_ndcg@10 & test\_recall@10 & used\_epochs \\
\midrule
64 & 0.054833 & 0.065294 & 48 \\
128 & 0.055468 & 0.065808 & 34 \\
256 & 0.052526 & 0.063628 & 35 \\
\bottomrule
\end{tabular}

\begin{tabular}{rrrr}
\toprule
mask\_probability & test\_ndcg@10 & test\_recall@10 & used\_epochs \\
\midrule
0.150000 & 0.052861 & 0.062872 & 32 \\
0.200000 & 0.057110 & 0.066208 & 30 \\
0.400000 & 0.057197 & 0.068399 & 49 \\
\bottomrule
\end{tabular}

\begin{tabular}{rrrr}
\toprule
max\_sequence\_length & test\_ndcg@10 & test\_recall@10 & used\_epochs \\
\midrule
100.000000 & 0.049173 & 0.060140 & 43 \\
200.000000 & 0.052861 & 0.062872 & 32 \\
NaN & 0.054840 & 0.065045 & 41 \\
\bottomrule
\end{tabular}

\begin{tabular}{rrrr}
\toprule
num\_hidden\_layers & test\_ndcg@10 & test\_recall@10 & used\_epochs \\
\midrule
2 & 0.053056 & 0.062899 & 29 \\
4 & 0.052861 & 0.062872 & 32 \\
8 & 0.046597 & 0.058668 & 57 \\
\bottomrule
\end{tabular}

\begin{tabular

# Grid search

In [3]:
grid_search_file = "grid_search_results.csv"
# Hyperparameter columns shown in the grid-search table, in display order.
search_parameters = ("pad_length", "hidden_layer_size", "learning_rate")

# Load the grid-search results, keep only the hyperparameter and metric
# columns, and order the rows by test NDCG@10 from highest to lowest.
df = (
    pd.read_csv(os.path.join("results", grid_search_file))
    .loc[:, [*search_parameters, *metrics]]
    .sort_values(by="test_ndcg@10", ascending=False)
)

# Emit the table as LaTeX, without the index and with special characters escaped.
print(df.to_latex(index=False, escape=True))

\begin{tabular}{rrrrrr}
\toprule
pad\_length & hidden\_layer\_size & learning\_rate & test\_ndcg@10 & test\_recall@10 & used\_epochs \\
\midrule
50 & 256 & 0.000500 & 0.050443 & 0.059165 & 29 \\
50 & 256 & 0.005000 & 0.050285 & 0.059369 & 58 \\
50 & 128 & 0.001000 & 0.048963 & 0.058538 & 32 \\
50 & 128 & 0.000500 & 0.048347 & 0.057300 & 29 \\
50 & 256 & 0.001000 & 0.048196 & 0.057430 & 38 \\
50 & 128 & 0.005000 & 0.043647 & 0.053944 & 67 \\
20 & 128 & 0.001000 & 0.041422 & 0.051569 & 43 \\
20 & 256 & 0.000500 & 0.040565 & 0.050017 & 29 \\
20 & 256 & 0.001000 & 0.040169 & 0.050754 & 33 \\
20 & 128 & 0.000500 & 0.039936 & 0.048442 & 33 \\
20 & 256 & 0.005000 & 0.035651 & 0.046332 & 64 \\
20 & 128 & 0.005000 & 0.031858 & 0.042249 & 54 \\
\bottomrule
\end{tabular}

