In [1]:
import pandas as pd
from benchmark.evaluations.evaluator import Evaluator
from config import _DEFAULT_ALPHAS, _DEFAULT_THETAS

# Single Evaluator instance; every evaluate_dataset call in the sweep cell goes through it.
ev = Evaluator()

In [11]:
# Evaluation target for this run: both values are passed positionally to
# ev.evaluate_dataset (dataset first, then model) by the sweep cell.
dataset, model = 'ERing', 'fcn'

In [12]:
def evaluate_and_label(method_key, label, dataset, model, *, alpha, param_config):
    """Run one evaluation through ``ev`` and return its summary tagged with ``label``.

    Parameters
    ----------
    method_key : str
        First positional argument of ``ev.evaluate_dataset``
        (this notebook uses 'confetti_naive' and 'confetti_optimized').
    label : str
        Value stored under the summary's "Method" key.
    dataset, model
        Forwarded positionally to ``ev.evaluate_dataset``.
    alpha : bool
        Forwarded unchanged as the ``alpha=`` keyword.
    param_config
        Forwarded unchanged as the ``param_config=`` keyword.

    Returns
    -------
    The second element of the pair returned by ``ev.evaluate_dataset``,
    with ``summary["Method"]`` set to ``label`` (assigned on that object itself).
    """
    # evaluate_dataset returns a pair; only the summary is used in this notebook.
    # Keeping the first element in a function-local name lets it be released on
    # return instead of lingering in the kernel namespace.
    _benchmark, summary = ev.evaluate_dataset(
        method_key, dataset, model, alpha=alpha, param_config=param_config
    )
    summary["Method"] = label
    return summary


# One entry per evaluation, in the order the rows appear in summary_df:
# (method key, "Method" label, alpha flag, param_config)
runs = [
    # -------------------------------
    # Single evaluation for Naive (uses the first default alpha)
    # -------------------------------
    ('confetti_naive', "Naive", True, _DEFAULT_ALPHAS[0]),
]

# -------------------------------
# Alpha sweep for Optimized
# -------------------------------
runs += [
    ('confetti_optimized', f"Optimized Alpha {alpha}", True, alpha)
    for alpha in _DEFAULT_ALPHAS
]

# -------------------------------
# Theta sweep for Optimized
# -------------------------------
runs += [
    ('confetti_optimized', f"Optimized Theta {theta}", False, theta)
    for theta in _DEFAULT_THETAS
]

# Storage for all summaries (rebuilt from scratch on every run of this cell)
all_summaries = [
    evaluate_and_label(
        method_key, label, dataset, model, alpha=alpha_flag, param_config=config
    )
    for method_key, label, alpha_flag, config in runs
]

# Combine all summaries
summary_df = pd.concat(all_summaries, ignore_index=True)

Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)
Shape: (30, 65, 4)


In [6]:
# Display the combined summary table built by the sweep cell.
# NOTE(review): the saved output of this cell lists Dataset = ArticularyWordRecognition,
# while the parameters cell currently sets dataset = 'ERing'. The output appears to come
# from an earlier execution with a different dataset value; re-run the parameters and
# sweep cells with that dataset to reproduce it.
summary_df

Unnamed: 0,Dataset,Sparsity,Confidence,Validity,Proximity,Method
0,ArticularyWordRecognition,3.1e-05,0.97959,1.0,1780.985148,Naive
1,ArticularyWordRecognition,2.2e-05,0.978461,1.0,1761.651879,Optimized Alpha 0.1
2,ArticularyWordRecognition,1.1e-05,0.984388,1.0,1760.548563,Optimized Alpha 0.3
3,ArticularyWordRecognition,1.1e-05,0.98278,1.0,1759.705432,Optimized Alpha 0.5
4,ArticularyWordRecognition,1.1e-05,0.986101,1.0,1761.726831,Optimized Alpha 0.7
5,ArticularyWordRecognition,1.1e-05,0.987901,1.0,1760.409323,Optimized Alpha 0.9
6,ArticularyWordRecognition,1.1e-05,0.991831,1.0,1763.960613,Optimized Alpha 1.0
7,ArticularyWordRecognition,0.0,0.985767,1.0,1749.523844,Optimized Theta 0.55
8,ArticularyWordRecognition,1.3e-05,0.987857,1.0,1766.136521,Optimized Theta 0.65
9,ArticularyWordRecognition,0.0,0.988042,1.0,1770.640597,Optimized Theta 0.75


In [9]:
# Display the combined summary table built by the sweep cell.
# NOTE(review): the saved output of this cell lists Dataset = Libras, while the
# parameters cell currently sets dataset = 'ERing'. The output appears to come from
# an earlier execution with a different dataset value; re-run the parameters and
# sweep cells with that dataset to reproduce it.
summary_df

Unnamed: 0,Dataset,Sparsity,Confidence,Validity,Proximity,Method
0,Libras,0.560864,0.777735,1.0,46.314489,Naive
1,Libras,0.78695,0.742342,1.0,26.839773,Optimized Alpha 0.1
2,Libras,0.789031,0.742291,1.0,26.89352,Optimized Alpha 0.3
3,Libras,0.786288,0.742838,1.0,26.899952,Optimized Alpha 0.5
4,Libras,0.784397,0.742574,1.0,26.94588,Optimized Alpha 0.7
5,Libras,0.783972,0.744657,1.0,27.083315,Optimized Alpha 0.9
6,Libras,0.722648,0.783436,1.0,29.772245,Optimized Alpha 1.0
7,Libras,0.777237,0.768105,1.0,29.382012,Optimized Theta 0.55
8,Libras,0.76171,0.825711,1.0,31.439357,Optimized Theta 0.65
9,Libras,0.75985,0.891692,1.0,36.048658,Optimized Theta 0.75


In [13]:
# Display the combined summary table built by the sweep cell.
# The saved output lists Dataset = ERing, matching dataset = 'ERing' in the parameters cell.
summary_df

Unnamed: 0,Dataset,Sparsity,Confidence,Validity,Proximity,Method
0,ERing,0.0,0.800605,0.833333,373.826806,Naive
1,ERing,0.0,0.799624,0.833333,378.940898,Optimized Alpha 0.1
2,ERing,0.0,0.793796,0.833333,377.914956,Optimized Alpha 0.3
3,ERing,0.0,0.791614,0.833333,379.731313,Optimized Alpha 0.5
4,ERing,0.0,0.792452,0.833333,379.074291,Optimized Alpha 0.7
5,ERing,0.0,0.790105,0.833333,379.020162,Optimized Alpha 0.9
6,ERing,0.0,0.798859,0.833333,378.508077,Optimized Alpha 1.0
7,ERing,0.0,0.786687,0.825397,372.03169,Optimized Theta 0.55
8,ERing,0.0,0.808584,0.821429,395.505875,Optimized Theta 0.65
9,ERing,0.0,0.775082,0.785714,383.417648,Optimized Theta 0.75
