# Carregando todas as Runs

In [1]:
from pathlib import Path
from ranx import Run, Qrels

In [2]:
# Locations of the evaluation inputs, relative to the notebook's working directory.
RUN_FOLDER = 'evaluation/runs'         # folder scanned for run files
QRELS_PATH = "evaluation/qrels.json"   # file the qrels are loaded from

In [3]:
# Wrap the run folder in a Path so its entries can be iterated when loading the runs.
source_folder = Path(RUN_FOLDER)

In [4]:
# Load one Run per file found directly inside `source_folder`.
#
# Entries are visited in sorted order so the loading order does not depend on
# how the filesystem happens to list the directory. Sub-directories and hidden
# entries (e.g. ".ipynb_checkpoints", ".DS_Store") are skipped: they are not
# run files and would otherwise be handed to Run.from_file.
runs = []
for run_path in sorted(source_folder.iterdir()):
    if not run_path.is_file() or run_path.name.startswith('.'):
        continue
    # Display name derived from the file stem: "_" becomes a space, "-" becomes
    # ".", and capitalize() upper-cases the first letter and lower-cases the rest.
    display_name = run_path.stem.replace('_', ' ').replace('-', '.').capitalize()
    runs.append(Run.from_file(run_path, name=display_name))

In [5]:
# Order the runs alphabetically by name; slice assignment keeps the same list
# object, so the reordering still happens in place.
runs[:] = sorted(runs, key=lambda run: run.name)

In [6]:
# Load the qrels from the file at QRELS_PATH; they are passed to compare()
# together with the runs.
qrels = Qrels.from_file(QRELS_PATH)

# Comparação entre Runs

In [7]:
from ranx import evaluate, compare

In [8]:
# Metrics reported in the comparison, all at cutoff 30.
# Alternatives tried earlier: recall@10 / map@10 / hit_rate@10 / mrr@10 as a
# list, or the single string 'mrr@10'.
METRICS = [
    "recall@30",
    "mrr@30",
]

In [12]:
# Score every loaded run against the qrels on the selected metrics and gather
# the results, including the pairwise significance markers, in one report.
report = compare(
    qrels=qrels,
    runs=runs,
    metrics=METRICS,
    max_p=0.05,         # p-value threshold for marking a difference as significant
    rounding_digits=4,  # number of decimals shown for each score
)

In [13]:
# Print the plain-text comparison table (one row per run, one column per metric).
print(report)

#    Model                    Recall@30          MRR@30
---  -----------------------  -----------------  ----------------
a    Adtw multivar            0.5486ᵉᶦ           0.8084ᵉ
b    Adtw useracceleration.x  0.5804ᵈᵉʰᶦ         0.8374ᵉ
c    Adtw useracceleration.y  0.5940ᵃᵈᵉʰᶦ        0.8612ᵈᵉʰ
d    Adtw useracceleration.z  0.5231ᵉᶦ           0.7885ᵉ
e    Ddtw multivar            0.4120             0.7164
f    Ddtw useracceleration.x  0.5804ᵈᵉʰᶦ         0.8374ᵉ
g    Ddtw useracceleration.y  0.5940ᵃᵈᵉʰᶦ        0.8612ᵈᵉʰ
h    Ddtw useracceleration.z  0.5231ᵉᶦ           0.7885ᵉ
i    Dtw multivar             0.4774ᵉ            0.9178ᵃᵇᶜᵈᵉᶠᵍʰˡ
j    Dtw useracceleration.x   0.6016ᵃᵇᵈᵉᶠʰᶦˡ     0.8735ᵃᵈᵉʰ
k    Dtw useracceleration.y   0.6797ᵃᵇᶜᵈᵉᶠᵍʰᶦʲˡ  0.9264ᵃᵇᶜᵈᵉᶠᵍʰʲˡ
l    Dtw useracceleration.z   0.5680ᵈᵉʰᶦ         0.8712ᵃᵈᵉʰ


In [11]:
# Print the report as a LaTeX table ready to paste into a paper.
# NOTE(review): the saved output of this cell shows 3-decimal scores although
# compare() is called with rounding_digits=4, and this cell's execution count
# (11) is lower than the compare cell's (12) -- the output looks stale.
# Re-run this cell after the compare cell (Restart Kernel -> Run All) before
# using the table.
print(report.to_latex())

% Add in preamble
\usepackage{graphicx}
\usepackage{booktabs}


% To change the table size, act on the resizebox argument `0.8`.
\begin{table*}[ht]
\centering
\caption{
Overall effectiveness of the models.
The best results are highlighted in boldface.
Superscripts denote significant differences in paired Student's t-test with $p \le 0.05$.
}
\resizebox{0.8\textwidth}{!}{
\begin{tabular}{c|l|c|c}
\toprule
\textbf{\#}
& \textbf{Model}
& \textbf{Recall@30}
& \textbf{MRR@30} \\ 
\midrule
a &
Adtw multivar &
0.549$^{ei}$\hphantom{$^{bcdfghjkl}$} &
0.808$^{e}$\hphantom{$^{bcdfghijkl}$} \\
b &
Adtw useracceleration.x &
0.580$^{dehi}$\hphantom{$^{acfgjkl}$} &
0.837$^{e}$\hphantom{$^{acdfghijkl}$} \\
c &
Adtw useracceleration.y &
0.594$^{adehi}$\hphantom{$^{bfgjkl}$} &
0.861$^{deh}$\hphantom{$^{abfgijkl}$} \\
d &
Adtw useracceleration.z &
0.523$^{ei}$\hphantom{$^{abcfghjkl}$} &
0.788$^{e}$\hphantom{$^{abcfghijkl}$} \\
e &
Ddtw multivar &
0.412\hphantom{$^{abcdfghijkl}$} &
0.716\hphantom{$^{abcd