## Evaluations

In [1]:
import os
from dotenv import load_dotenv
from huggingface_hub import login
from datasets import load_dataset

  from .autonotebook import tqdm as notebook_tqdm


In [2]:
# Enable IPython's autoreload extension in mode 2 so edits to imported
# project modules (e.g. utils/evaluator.py) are picked up without a kernel restart.
%load_ext autoreload
%autoreload 2

# Import the project-local evaluator module and expose its `evaluate`
# function under a short name for the cells that follow.
import utils.evaluator as evaluator
evaluate = evaluator.evaluate

In [3]:
# Read variables from a .env file into the process environment;
# override=True lets values from .env replace ones that are already set.
load_dotenv(override=True)

# Indexing os.environ directly raises KeyError if HF_TOKEN is not defined.
hf_token = os.environ['HF_TOKEN']
# NOTE(review): add_to_git_credential=True asks huggingface_hub to store the
# token in the git credential helper; the recorded output shows no helper is
# configured, so this only produces a warning here. Confirm it is needed if
# the notebook only downloads a dataset.
login(hf_token, add_to_git_credential=True)

# Fetch the dataset from the Hugging Face Hub; later cells index its 'test' split.
dataset = load_dataset("aslam-naseer/js-function-complexity-processed")

Token has not been saved to git credential helper.
Note: Environment variable`HF_TOKEN` is set and is the current active token independently from the token you've just configured.


[1m[31mCannot authenticate through git-credential as no helper is defined on your machine.
You might have to re-authenticate when pushing to the Hugging Face Hub.
Run the following command in your terminal in case you want to set the 'store' credential helper as default.

git config --global credential.helper store

Read https://git-scm.com/book/en/v2/Git-Tools-Credential-Storage for more details.[0m


In [10]:
# Upper bound on the number of test examples used for evaluation.
TEST_SAMPLE_SIZE = 200

# Take the first TEST_SAMPLE_SIZE rows of the test split. The count is capped
# at the split length so that select() is never handed out-of-range indices
# when the split holds fewer rows than requested.
test_split = dataset['test']
test_set = test_split.select(range(min(TEST_SAMPLE_SIZE, len(test_split))))

# Number of rows actually selected; passed to evaluate() as `size`.
test_size = len(test_set)

#### Evaluator tests: random and constant baselines

In [None]:
import random
# Seed the global RNG so the random baseline below draws the same
# sequence of values each time this cell is run.
random.seed(42)

def generate_random(item):
    """Random baseline predictor: ignore ``item`` and return a random score.

    An integer is drawn uniformly from 1..101 (``random.randint`` includes
    both endpoints) and divided by 10.0, so the result is a float in
    0.1..10.1 in steps of 0.1.

    NOTE(review): the inclusive upper bound allows 10.1 — confirm that is
    intended rather than a 0.1..10.0 range.
    """
    return random.randint(1, 101) / 10.0

# Run the project evaluator with the random baseline over the selected test rows.
evaluate(generate_random, test_set, size=test_size)

100%|██████████| 200/200 [00:00<00:00, 20214.97it/s]

[92m0.9 [91m4.8 [91m3.8 [92m0.5 [93m0.5 [91m2.0 [92m0.3 [91m5.2 [91m3.3 [91m3.4 [91m3.2 [91m5.1 [93m1.2 [91m2.8 [91m3.6 [91m4.4 [93m0.7 [91m5.6 [91m4.0 [91m4.4 [93m0.6 [93m1.1 [91m1.9 [91m5.8 [91m2.1 [91m1.4 [91m3.7 [92m0.0 [91m4.0 [91m1.3 [91m2.5 [91m1.8 [91m4.7 [91m4.6 [91m2.3 [91m1.7 [91m4.3 [91m7.5 [91m7.8 [93m0.7 [91m4.2 [91m2.5 [91m1.7 [91m2.0 [91m4.3 [91m1.6 [91m2.6 [91m2.2 [91m3.5 [92m0.1 [91m4.2 [93m0.5 [93m1.4 [91m2.1 [91m5.4 [91m4.7 [91m2.2 [93m1.7 [91m5.5 [93m0.9 [91m4.0 [91m1.6 [92m0.4 [91m4.5 [91m6.8 [93m0.7 [91m2.0 [91m2.7 [91m2.8 [91m4.3 [91m4.3 [91m4.5 [91m3.2 [91m2.3 [91m1.8 [91m1.8 [91m4.1 [91m2.0 [91m1.5 [93m0.8 [92m0.5 [91m5.2 [93m0.5 [91m7.0 [91m2.5 [92m0.2 [91m2.7 [91m5.8 [91m1.7 [92m0.4 [91m4.6 [91m1.9 [91m5.9 [91m1.4 [91m5.4 [91m1.0 [92m0.3 [93m1.2 [91m3.6 [91m5.2 [91m1.6 [91m1.6 [93m0.6 [91m1.6 [91m4.4 [92m0.6 [91m6.8 [91m7.7 [93m0.8 [91m5.6 [91m5.3 




In [None]:
def generate_five(item):
    """Constant baseline predictor: return 5 for every input, ignoring ``item``."""
    constant_score = 5
    return constant_score


# Run the project evaluator with the constant-5 baseline over the same test rows.
evaluate(generate_five, test_set, size=test_size)

100%|██████████| 200/200 [00:00<00:00, 13970.54it/s]

[91m4.1 [91m1.3 [93m0.8 [91m5.0 [91m1.9 [91m3.8 [91m1.8 [91m2.0 [93m1.2 [92m0.2 [92m0.5 [93m0.6 [91m3.2 [91m1.0 [91m1.0 [91m3.9 [91m3.8 [93m1.0 [92m0.2 [91m2.2 [91m2.6 [91m2.6 [93m0.9 [93m1.2 [92m0.1 [91m3.8 [92m0.5 [91m3.4 [92m0.0 [93m0.7 [91m2.1 [91m3.9 [91m3.9 [91m2.0 [93m0.9 [91m3.2 [92m0.5 [91m4.6 [91m3.8 [93m1.2 [91m3.6 [91m3.9 [91m1.3 [92m0.2 [92m0.5 [91m2.2 [91m1.0 [91m1.6 [91m3.4 [91m3.8 [91m3.8 [92m0.0 [91m4.2 [92m0.5 [93m1.0 [92m0.3 [91m1.3 [91m3.6 [91m2.1 [91m1.0 [92m0.1 [92m0.5 [91m1.6 [91m1.4 [91m3.8 [92m0.4 [92m0.4 [92m0.2 [91m1.3 [92m0.2 [92m0.1 [91m1.0 [93m1.2 [91m2.6 [91m3.0 [91m2.1 [91m2.1 [91m1.7 [91m1.6 [93m0.6 [91m1.4 [91m2.0 [93m0.8 [91m4.1 [91m2.3 [93m0.6 [92m0.4 [91m2.2 [92m0.2 [91m4.4 [93m0.8 [91m1.4 [91m1.9 [91m1.4 [91m2.2 [91m3.8 [91m1.6 [91m3.2 [91m1.8 [91m2.3 [91m2.6 [91m1.7 [91m2.1 [91m1.6 [93m0.5 [91m2.8 [91m4.7 [91m3.9 [92m0.0 [93m0.7 [92m0.3 


