In [1]:
import pandas as pd
import numpy as np
import regex #dev
from nltk.translate.bleu_score import sentence_bleu
from nltk.translate.meteor_score import meteor_score
from langchain_community.embeddings import GPT4AllEmbeddings
from langchain_community.embeddings import HuggingFaceEmbeddings
from sklearn.metrics.pairwise import cosine_similarity
from sentence_transformers import SentenceTransformer, util
from nltk.translate.meteor_score import meteor_score


  from .autonotebook import tqdm as notebook_tqdm


In [2]:
from nltk.translate.bleu_score import sentence_bleu

def score_bleu(pred:str, y:str, type=2):
    """Average character-level BLEU over paired texts.

    Despite the ``str`` annotations, ``pred`` and ``y`` are iterated pairwise
    with ``zip``, so each is expected to be a sequence of strings (``validate``
    passes NumPy arrays of strings). Every string is tokenised with
    ``list(...)``, i.e. into single characters, so the n-grams scored here are
    character n-grams, not word n-grams.

    Args:
        pred: Texts placed on the *reference* side of ``sentence_bleu`` (its
            first argument). Note that ``validate`` passes the ground truth
            in this position.
        y: Texts placed on the *hypothesis* side of ``sentence_bleu``.
        type: Highest n-gram order to score; must be 2, 3 or 4.

    Returns:
        The mean of the per-pair sentence BLEU scores (NaN when there are no
        pairs). Pairs beyond the shorter input are ignored by ``zip``.

    Raises:
        ValueError: If ``type`` is not 2, 3 or 4. Previously this surfaced as
            an ``UnboundLocalError`` on ``weights`` inside the loop.
    """
    # 0.33 (rather than 1/3) is kept on purpose so that scores stay comparable
    # with results produced by earlier runs of this notebook.
    weights_by_order = {
        2: [0.5, 0.5],
        3: [0.33, 0.33, 0.33],
        4: [0.25, 0.25, 0.25, 0.25],
    }
    if type not in weights_by_order:
        raise ValueError(
            f"Unsupported BLEU type {type!r}; expected one of 2, 3 or 4"
        )
    weights = weights_by_order[type]

    res = [
        sentence_bleu([list(xe)], list(ye), weights)
        for xe, ye in zip(pred, y)
    ]
    return np.average(res)
    
def _embedding_cosine_similarity(x:str, y:str, embedding_fun) -> float:
    """Cosine similarity between the embeddings of two texts.

    Args:
        x: First text.
        y: Second text.
        embedding_fun: Object exposing ``embed_query(text)``, which must
            return the embedding vector for ``text``.

    Returns:
        The cosine similarity of the two embedding vectors as a plain float.
    """
    vec_x = embedding_fun.embed_query(x)
    vec_y = embedding_fun.embed_query(y)
    # cosine_similarity returns a (1, 1) matrix for two single-row inputs;
    # unwrap it so the declared ``float`` return type actually holds.
    return float(cosine_similarity([vec_x], [vec_y])[0][0])

def embedding_cosine_similarity(x:str, y:str, embedding_fun) -> float:
    """Mean embedding cosine similarity over paired texts.

    ``x`` and ``y`` are walked in lockstep with ``zip`` (so, despite the
    ``str`` annotations, they are expected to be sequences of texts) and each
    pair is scored with ``_embedding_cosine_similarity``.

    Args:
        x: Texts on one side of each pair.
        y: Texts on the other side of each pair.
        embedding_fun: Embedding object forwarded unchanged to the per-pair
            helper.

    Returns:
        ``np.average`` of the per-pair similarities.
    """
    pair_scores = [
        _embedding_cosine_similarity(left, right, embedding_fun)
        for left, right in zip(x, y)
    ]
    return np.average(pair_scores)

def score_meteor(pred:str, y:str) -> float:
    """Mean METEOR score over paired texts.

    ``pred`` and ``y`` are paired with ``zip`` (so, despite the ``str``
    annotations, they are expected to be sequences of texts). Each text is
    tokenised on whitespace with ``str.split``.

    Args:
        pred: Texts whose tokens are passed as the single reference to
            ``meteor_score``.
        y: Texts whose tokens are passed as the hypothesis to
            ``meteor_score``.

    Returns:
        ``np.average`` of the per-pair METEOR scores.
    """
    per_pair = [
        meteor_score([ref_text.split()], hyp_text.split())
        for ref_text, hyp_text in zip(pred, y)
    ]
    return np.average(per_pair)

In [3]:
from pprint import pprint


def validate(val_file, pred_file, emb_fun):
    """Score one prediction CSV against a validation CSV and print a report.

    Reads the ``steps`` column of ``val_file`` and the ``result`` column of
    ``pred_file``, computes BLEU-2/3/4, the mean embedding cosine similarity
    and the mean METEOR score, and pretty-prints them together with the
    prediction file name.

    Args:
        val_file: Path of the CSV holding the ``steps`` column.
        pred_file: Path of the CSV holding the ``result`` column.
        emb_fun: Embedding object forwarded to ``embedding_cosine_similarity``.

    Returns:
        The tuple ``(bleu_2, bleu_3, bleu_4, cosim)``. METEOR is printed in
        the report but is not part of the return value.
    """
    val_frame = pd.read_csv(val_file)
    pred_frame = pd.read_csv(pred_file)

    # An alternative validation column used at some point: `response`.
    targets = val_frame.steps.values
    outputs = pred_frame.result.values

    # The validation texts are passed first to every scorer.
    bleu_by_order = {
        order: score_bleu(targets, outputs, order) for order in (2, 3, 4)
    }
    similarity = embedding_cosine_similarity(targets, outputs, emb_fun)
    meteor_avg = score_meteor(targets, outputs)

    report = {
        "dataset": pred_file,
        "cosim": similarity,
        "bleu_2": bleu_by_order[2],
        "bleu_3": bleu_by_order[3],
        "bleu_4": bleu_by_order[4],
        "meteor": meteor_avg,
    }
    pprint(report)

    return bleu_by_order[2], bleu_by_order[3], bleu_by_order[4], similarity



In [4]:
# Embedding backend handed to validate(). It must expose embed_query(text),
# which _embedding_cosine_similarity calls once per text.
emb_fun = GPT4AllEmbeddings()
# Alternative backend (disabled):
# emb_fun = HuggingFaceEmbeddings(model_name="BAAI/bge-large-en-v1.5")


bert_load_from_file: gguf version     = 2
bert_load_from_file: gguf alignment   = 32
bert_load_from_file: gguf data offset = 695552
bert_load_from_file: model name           = BERT
bert_load_from_file: model architecture   = bert
bert_load_from_file: model file type      = 1
bert_load_from_file: bert tokenizer vocab = 30522


In [5]:
# Disabled result-file constants. They are referenced only by commented-out
# validate(...) calls in the next cell; re-enable both together.
# CBR_10_50 = "cbr_10_50_gpt2_results_p.csv"
# CBR_10_100 = "cbr_10_100_gpt2_results_p.csv"
# CBR_15_30 = "cbr_15_30_gpt2_results_p.csv"
# CBR_15_70 = "cbr_15_70_gpt2_results_p.csv"
# CBR_20_50 = "cbr_20_50_gpt2_results_p.csv"
# CBR_2_4NF = "cbr_2_4_nf_gpt2_results_p.csv"

In [6]:
# Validation CSV; validate() reads its `steps` column.
VAL = "_validation.csv"
# Prediction CSVs; validate() reads the `result` column of each.
PE = "validation_pe2_gpt2_results_p.csv"
CBR_10_00 = "validation_cbr_00_gpt2_results_p.csv"


CBR_1_0 = "cbr_1_0_f_gpt2_results_p.csv"
CBR_1_1 = "cbr_1_1_f_gpt2_results_p.csv"
CBR_1_2 = "cbr_1_2_f_gpt2_results_p.csv"
CBR_1_3 = "cbr_1_3_f_gpt2_results_p.csv"
CBR_1_4 = "cbr_1_4_f_gpt2_results_p.csv"
CBR_1_5 = "cbr_1_5_f_gpt2_results_p.csv"
CBR_2_0 = "cbr_2_0_f_gpt2_results_p.csv"
CBR_2_2 = "cbr_2_2_f_gpt2_results_p.csv"
CBR_2_4 = "cbr_2_4_f_gpt2_results_p.csv"
CBR_2_6 = "cbr_2_6_f_gpt2_results_p.csv"
CBR_2_8 = "cbr_2_8_f_gpt2_results_p.csv"
CBR_3_0 = "cbr_3_0_f_gpt2_results_p.csv"
CBR_AUGMENTATION = "cbr_augmentation_gpt2_results_p.csv"
# Used as the validation file for CBR_AUGMENTATION in the commented-out call below.
CBR_AUGMENTATION_INPUT = "_cbr_augmentation.csv"

CBR_0_10 = "cbr_0_10_f_gpt2_results_p.csv"
CBR_0_18 = "cbr_0_18_f_gpt2_results_p.csv"
CBR_1_9 = "cbr_1_9_f_gpt2_results_p.csv"
CBR_3_3 = "cbr_3_3_f_gpt2_results_p.csv"
CBR_3_6 = "cbr_3_6_f_gpt2_results_p.csv"
CBR_3_9 = "cbr_3_9_f_gpt2_results_p.csv"
CBR_3_12 = "cbr_3_12_f_gpt2_results_p.csv"
CBR_4_0 = "cbr_4_0_f_gpt2_results_p.csv"
CBR_4_4 = "cbr_4_4_f_gpt2_results_p.csv"
CBR_4_8 = "cbr_4_8_f_gpt2_results_p.csv"
CBR_5_0 = "cbr_5_0_f_gpt2_results_p.csv"
CBR_5_5 = "cbr_5_5_f_gpt2_results_p.csv"
CBR_8_2 = "cbr_8_2_f_gpt2_results_p.csv"
CBR_9_1 = "cbr_9_1_f_gpt2_results_p.csv"
CBR_10_5 = "cbr_10_5_f_gpt2_results_p.csv"
CBR_10_18 = "cbr_10_18_f_gpt2_results_p.csv"
CBR_1_7 = "cbr_1_7_f_gpt2_results_p.csv"


# Only the uncommented validate(...) calls below run; each one pretty-prints
# a single metrics dict. Uncomment a line to score that file as well.
validate(VAL, CBR_1_7, emb_fun)
# validate(VAL, CBR_0_10, emb_fun)
# validate(VAL, CBR_0_18, emb_fun)
# validate(VAL, CBR_1_9, emb_fun)
# validate(VAL, CBR_3_3, emb_fun)
# validate(VAL, CBR_3_6, emb_fun)
# validate(VAL, CBR_3_9, emb_fun)
# validate(VAL, CBR_3_12, emb_fun)
# validate(VAL, CBR_4_0, emb_fun)
# validate(VAL, CBR_4_4, emb_fun)
# validate(VAL, CBR_4_8, emb_fun)
# validate(VAL, CBR_5_0, emb_fun)
# validate(VAL, CBR_5_5, emb_fun)
# validate(VAL, CBR_8_2, emb_fun)
# validate(VAL, CBR_9_1, emb_fun)
# validate(VAL, CBR_10_5, emb_fun)
# validate(VAL, CBR_10_18, emb_fun)

# validate(CBR_AUGMENTATION_INPUT, CBR_AUGMENTATION, emb_fun)

# validate(VAL, CBR_1_0, emb_fun)
# validate(VAL, CBR_1_1, emb_fun)
# validate(VAL, CBR_1_2, emb_fun)
# validate(VAL, CBR_1_3, emb_fun)
# validate(VAL, CBR_1_4, emb_fun)
# validate(VAL, CBR_1_5, emb_fun)
# validate(VAL, CBR_2_0, emb_fun)
validate(VAL, CBR_2_2, emb_fun)
# validate(VAL, CBR_2_4, emb_fun)
# validate(VAL, CBR_2_6, emb_fun)
# validate(VAL, CBR_2_8, emb_fun)
# validate(VAL, CBR_3_0, emb_fun)

# validate(VAL, PE, emb_fun)
# validate(VAL, CBR_10_00, emb_fun)
# NOTE: CBR_10_50 .. CBR_20_50 are defined only in the commented-out cell
# above; restore those definitions before uncommenting the calls below.
# validate(VAL, CBR_10_50, emb_fun)
# validate(VAL, CBR_10_100, emb_fun)
# validate(VAL, CBR_15_30, emb_fun)
# validate(VAL, CBR_15_70, emb_fun)
# validate(VAL, CBR_20_50, emb_fun)

# Emits a single blank line after the reports.
print()

{'bleu_2': 0.5167929124108913,
 'bleu_3': 0.4127503923426222,
 'bleu_4': 0.3282499017714824,
 'cosim': 0.6416441626815853,
 'dataset': 'cbr_1_7_f_gpt2_results_p.csv',
 'meteor': 0.16849076754715425}
{'bleu_2': 0.49909559360747796,
 'bleu_3': 0.39813183923674667,
 'bleu_4': 0.31646266158562036,
 'cosim': 0.6404896416096827,
 'dataset': 'cbr_2_2_f_gpt2_results_p.csv',
 'meteor': 0.16224721347903298}



In [7]:
# 2000 samples - GPT2
{'bleu_2': 0.3983345205866027,
 'bleu_3': 0.30944811693835267,
 'bleu_4': 0.24022563642876657,
    'cosim': 0.5424127484702235,
 'dataset': 'validation_pe2_gpt2_results_p.csv'}
{'bleu_2': 0.48248109421980445,
 'bleu_3': 0.3905828115755981,
 'bleu_4': 0.31578191811376116,
    'cosim': 0.666354314896669,
 'dataset': 'validation_cbr_00_gpt2_results_p.csv'}

{'bleu_2': 0.5135314303899466,
 'bleu_3': 0.41031691972928647,
 'bleu_4': 0.3264546186759959,
 'cosim': 0.6420897206142041,
 'dataset': 'cbr_2_4_f_gpt2_results_p.csv',
 'meteor': 0.16761964253627915}
{'bleu_2': 0.48632734961526564,
 'bleu_3': 0.3888256968568053,
 'bleu_4': 0.3098112808075717,
 'cosim': 0.6381431812683747,
 'dataset': 'cbr_2_4_nf_gpt2_results_p.csv',
 'meteor': 0.16152027514060094}

{'bleu_2': 0.4605249371516188,
 'bleu_3': 0.3672828277689744,
 'bleu_4': 0.29242323187765523,
 'cosim': 0.6224588947749784,
 'dataset': 'cbr_1_0_f_gpt2_results_p.csv',
 'meteor': 0.15114901895701202}
{'bleu_2': 0.5008532851272113,
 'bleu_3': 0.39895022542948766,
 'bleu_4': 0.3165822916399227,
 'cosim': 0.631748446641241,
 'dataset': 'cbr_1_1_f_gpt2_results_p.csv',
 'meteor': 0.1601358745813599}
{'bleu_2': 0.5049481615752992,
 'bleu_3': 0.4020262137516014,
 'bleu_4': 0.3188933045415751,
 'cosim': 0.6329555036721813,
 'dataset': 'cbr_1_2_f_gpt2_results_p.csv',
 'meteor': 0.16276269476505337}
{'bleu_2': 0.5098409318751849,
 'bleu_3': 0.4063832063225951,
 'bleu_4': 0.32248182803840475,
 'cosim': 0.6363822328154993,
 'dataset': 'cbr_1_3_f_gpt2_results_p.csv',
 'meteor': 0.164120997339497}
{'bleu_2': 0.513961780083978,
 'bleu_3': 0.4094480384487455,
 'bleu_4': 0.3247703624896944,
 'cosim': 0.6366393653544963,
 'dataset': 'cbr_1_4_f_gpt2_results_p.csv',
 'meteor': 0.16580318468529792}
{'bleu_2': 0.5172688570409628,
 'bleu_3': 0.4125801679194503,
 'bleu_4': 0.32743888409062727,
 'cosim': 0.638217141540082,
 'dataset': 'cbr_1_5_f_gpt2_results_p.csv',
 'meteor': 0.16643223634061743}
{'bleu_2': 0.47266690834986086,
 'bleu_3': 0.37809412949835436,
 'bleu_4': 0.30183699777312034,
 'cosim': 0.6387646681933659,
 'dataset': 'cbr_2_0_f_gpt2_results_p.csv',
 'meteor': 0.15432693611617967}
{'bleu_2': 0.5135314303899466,
 'bleu_3': 0.41031691972928647,
 'bleu_4': 0.3264546186759959,
 'cosim': 0.6420897206142041,
 'dataset': 'cbr_2_4_f_gpt2_results_p.csv',
 'meteor': 0.16761964253627915}
{'bleu_2': 0.49909559360747796,
 'bleu_3': 0.39813183923674667,
 'bleu_4': 0.31646266158562036,
 'cosim': 0.6404896416096827,
 'dataset': 'cbr_2_2_f_gpt2_results_p.csv',
 'meteor': 0.16224721347903298}
{'bleu_2': 0.5214425292241511,
 'bleu_3': 0.4174974315934158,
 'bleu_4': 0.332821690302636,
 'cosim': 0.6459960499079649,
 'dataset': 'cbr_2_6_f_gpt2_results_p.csv',
 'meteor': 0.1708053471636928}
{'bleu_2': 0.5229039327917592,
 'bleu_3': 0.418502965262687,
 'bleu_4': 0.33367062800861697,
 'cosim': 0.6506090559416784,
 'dataset': 'cbr_2_8_f_gpt2_results_p.csv',
 'meteor': 0.17140731978413712}
{'bleu_2': 0.48356388677090023,
 'bleu_3': 0.3881083293437209,
 'bleu_4': 0.310789009549226,
 'cosim': 0.6425574850372006,
 'dataset': 'cbr_3_0_f_gpt2_results_p.csv',
 'meteor': 0.16026034732989472}
{'bleu_2': 0.5210172283424189,
 'bleu_3': 0.4173593512658833,
 'bleu_4': 0.3327383887248683,
 'cosim': 0.6441947974209954,
 'dataset': 'cbr_0_10_f_gpt2_results_p.csv',
 'meteor': 0.17272521652790115}
{'bleu_2': 0.5197705470178512,
 'bleu_3': 0.416759406737027,
 'bleu_4': 0.3326414169474309,
 'cosim': 0.649753714162366,
 'dataset': 'cbr_0_18_f_gpt2_results_p.csv',
 'meteor': 0.17322264852931543}
{'bleu_2': 0.5216893583254358,
 'bleu_3': 0.4173774451228745,
 'bleu_4': 0.3324749911469302,
 'cosim': 0.6453255492557426,
 'dataset': 'cbr_1_9_f_gpt2_results_p.csv',
 'meteor': 0.17045876332388263}
{'bleu_2': 0.5047387006841945,
 'bleu_3': 0.40376421021598297,
 'bleu_4': 0.32185587116777337,
 'cosim': 0.6444761763276391,
 'dataset': 'cbr_3_3_f_gpt2_results_p.csv',
 'meteor': 0.16618162933892047}
{'bleu_2': 0.5180327774132464,
 'bleu_3': 0.4156391698850392,
 'bleu_4': 0.3319224225672656,
 'cosim': 0.6519588623305002,
 'dataset': 'cbr_3_6_f_gpt2_results_p.csv',
 'meteor': 0.17263288786907602}
{'bleu_2': 0.5196454516077718,
 'bleu_3': 0.4166248807429604,
 'bleu_4': 0.33280017541286117,
 'cosim': 0.6528032255301622,
 'dataset': 'cbr_3_9_f_gpt2_results_p.csv',
 'meteor': 0.17285133284904217}
{'bleu_2': 0.5203235631285001,
 'bleu_3': 0.41707700842492973,
 'bleu_4': 0.3330261711786993,
 'cosim': 0.6506451983578166,
 'dataset': 'cbr_3_12_f_gpt2_results_p.csv',
 'meteor': 0.17264388931851066}
{'bleu_2': 0.4910358161163606,
 'bleu_3': 0.3942748163935558,
 'bleu_4': 0.3158869650348131,
 'cosim': 0.6516947415521269,
 'dataset': 'cbr_4_0_f_gpt2_results_p.csv',
 'meteor': 0.16155180164700056}
{'bleu_2': 0.5111345025749867,
 'bleu_3': 0.4095380125260628,
 'bleu_4': 0.3268232787564083,
 'cosim': 0.6483400573385137,
 'dataset': 'cbr_4_4_f_gpt2_results_p.csv',
 'meteor': 0.16775905806355731}
{'bleu_2': 0.5171074896986763,
 'bleu_3': 0.4151533521436935,
 'bleu_4': 0.33211842005614167,
 'cosim': 0.6532945395387142,
 'dataset': 'cbr_4_8_f_gpt2_results_p.csv',
 'meteor': 0.172740328417105}
{'bleu_2': 0.48996431818240754,
 'bleu_3': 0.3940614003882808,
 'bleu_4': 0.3164033803634824,
 'cosim': 0.6545035875589263,
 'dataset': 'cbr_5_0_f_gpt2_results_p.csv',
 'meteor': 0.16423983383010266}
{'bleu_2': 0.5163420213910953,
 'bleu_3': 0.4140777800798072,
 'bleu_4': 0.3309043846991809,
 'cosim': 0.6515908427279156,
 'dataset': 'cbr_5_5_f_gpt2_results_p.csv',
 'meteor': 0.17166272327123733}
{'bleu_2': 0.5005480642302962,
 'bleu_3': 0.4030082175204756,
 'bleu_4': 0.32381264206423965,
 'cosim': 0.6584410176935936,
 'dataset': 'cbr_8_2_f_gpt2_results_p.csv',
 'meteor': 0.16994776456099742}
{'bleu_2': 0.49409454046227586,
 'bleu_3': 0.3987899141304889,
 'bleu_4': 0.3213637166094768,
 'cosim': 0.6630548355943967,
 'dataset': 'cbr_9_1_f_gpt2_results_p.csv',
 'meteor': 0.170006741556408}
{'bleu_2': 0.5062911437712141,
 'bleu_3': 0.4081891377092729,
 'bleu_4': 0.32821061123062034,
 'cosim': 0.6603016403949443,
 'dataset': 'cbr_10_5_f_gpt2_results_p.csv',
 'meteor': 0.1730870390747991}
{'bleu_2': 0.5192090706927773,
 'bleu_3': 0.4165542778817735,
 'bleu_4': 0.3332096566084734,
 'cosim': 0.6555820014800237,
 'dataset': 'cbr_10_18_f_gpt2_results_p.csv',
 'meteor': 0.17249109912106023}









{'bleu_2': 0.4875288455046744,
 'bleu_3': 0.39074283373782803,
 'bleu_4': 0.3122268349424152,
    'cosim': 0.6433889681771227,
 'dataset': 'cbr_10_50_gpt2_results_p.csv'}
{'bleu_2': 0.4985678191902936,
 'bleu_3': 0.3978690493508338,
 'bleu_4': 0.31649502545970315,
    'cosim': 0.6352831140826022,
 'dataset': 'cbr_10_100_gpt2_results_p.csv'}
{'bleu_2': 0.4919166557435214,
 'bleu_3': 0.3961473599890203,
 'bleu_4': 0.31835774297098984,
    'cosim': 0.6558141635765466,
 'dataset': 'cbr_15_30_gpt2_results_p.csv'}
{'bleu_2': 0.4986479916420456,
 'bleu_3': 0.3996324961871879,
 'bleu_4': 0.3194464705249102,
 'cosim': 0.6467255276049088,
 'dataset': 'cbr_15_70_gpt2_results_p.csv'}
{'bleu_2': 0.49940841452170787,
 'bleu_3': 0.4017801137519504,
 'bleu_4': 0.3224362106657506,
    'cosim': 0.6543811180657189,
 'dataset': 'cbr_20_50_gpt2_results_p.csv'}



# 10K augmentation evaluation

{'bleu_2': 0.48617813323490583,
 'bleu_3': 0.39406017970159696,
 'bleu_4': 0.31886395039233456,
 'cosim': 0.6635087819509142,
 'dataset': 'cbr_augmentation_gpt2_results_p.csv',
 'meteor': 0.1714686777360262}


{'bleu_2': 0.48617813323490583,
 'bleu_3': 0.39406017970159696,
 'bleu_4': 0.31886395039233456,
 'cosim': 0.6635087819509142,
 'dataset': 'cbr_augmentation_gpt2_results_p.csv',
 'meteor': 0.1714686777360262}

In [8]:
# 1000 samples - Llama 7B

{'bleu_2': 0.5303783219506372,
 'bleu_3': 0.4462962309433792,
 'bleu_4': 0.3753365885749213,
 'cosim': 0.7618514457651429,
 'dataset': 'validation_pe2_results.csv'}

# 1000 samples - GPT2

{'bleu_2': 0.2994730175354327,
 'bleu_3': 0.23035581694045432,
 'bleu_4': 0.17846223814285703,
 'cosim': 0.531551547892038,
 'dataset': 'processed_results_pe2.csv'}

{'bleu_2': 0.3870437972012796,
 'bleu_3': 0.3131764675272803,
 'bleu_4': 0.2539475163866975,
 'cosim': 0.6280271330429938,
 'dataset': 'processed_results_cbr.csv'}

{'bleu_2': 0.3870437972012796,
 'bleu_3': 0.3131764675272803,
 'bleu_4': 0.2539475163866975,
 'cosim': 0.6280271330429938,
 'dataset': 'processed_results_cbr.csv'}

In [9]:
# 1000 samples

{'bleu_2': 0.5396068827158336,
 'bleu_3': 0.45617526600881114,
 'bleu_4': 0.38571558598671957,
        'cosim': 0.7725588565018909,
 'dataset': 'small_validation_pe_results_p.csv'}
{'bleu_2': 0.542812939755022,
 'bleu_3': 0.45964949518984566,
 'bleu_4': 0.38905272937763996,
        'cosim': 0.7654708413731175,
 'dataset': 'small_validation_cbr_00_results_p.csv'}
{'bleu_2': 0.5513406686475593,
 'bleu_3': 0.4653106822819303,
 'bleu_4': 0.39302688807601166,
        'cosim': 0.7632422508541131,
 'dataset': 'small_validation_cbr_00_ing_results_p.csv'}
{'bleu_2': 0.5484066657634896,
 'bleu_3': 0.46442737156905955,
 'bleu_4': 0.3931165177905519,
        'cosim': 0.7621681662680856,
 'dataset': 'small_validation_cbr_00_nam_results_p.csv'}
{'bleu_2': 0.5509298184714941,
 'bleu_3': 0.4681376893134645,
 'bleu_4': 0.39796219635868374,
       'cosim': 0.7685492702758651,
 'dataset': 'small_validation_cbr_00_large_half_results_p.csv'}


print()




In [10]:
# 500 samples

{'bleu_2': 0.5426869728805064,
 'bleu_3': 0.458388462134935,
 'bleu_4': 0.3874877600270263,
 'cosim': 0.7707031342117534,
 'dataset': 'small_validation_pe_results_p.csv'}
{'bleu_2': 0.5438659346908847,
 'bleu_3': 0.46062494514966273,
 'bleu_4': 0.38978623748374275,
 'cosim': 0.7669587393039417,
 'dataset': 'small_validation_cbr_00_results_p.csv'}
{'bleu_2': 0.54496451882725,
 'bleu_3': 0.4593921251448247,
 'bleu_4': 0.38765187507372423,
 'cosim': 0.7590582257581593,
 'dataset': 'small_validation_cbr_00_ing_results_p.csv'}
{'bleu_2': 0.5460347176785251,
 'bleu_3': 0.4617148488887874,
 'bleu_4': 0.39058422725089476,
 'cosim': 0.7601030492891336,
 'dataset': 'small_validation_cbr_00_nam_results_p.csv'}

print()




In [11]:
# embedding_fun = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
# embedding_fun = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L12-v2")
# embedding_fun = HuggingFaceEmbeddings(model_name="sentence-transformers/paraphrase-MiniLM-L6-v2")
# embedding_fun = HuggingFaceEmbeddings(model_name="BAAI/bge-large-en-v1.5")
# embedding_fun = GPT4AllEmbeddings()
# embedding_fun = HuggingFaceEmbeddings()

# model = SentenceTransformer('sentence-transformers/all-MiniLM-L6-v2')

# len(embedding_fun.embed_query("sdf"))
# len(model.encode("asd"))

In [12]:
# embedding_cosine_similarity(y, pred, GPT4AllEmbeddings())

In [13]:
"""
PE -----
embedding_sim: 0.77055
embedding_sim_pf: 0.72920
HuggingFaceEmbeddings: 0.82272
bl2: 0.54114
bl3: 0.45684
bl4: 0.38604

CBR_00 -----
embedding_sim: 0.76286
embedding_sim_pf: 0.72389
HuggingFaceEmbeddings: 0.81547
bl2: 0.54043
bl3: 0.45686
bl4: 0.38614

CBR_00_ing -----
embedding_sim: 0.76121
bl2: 0.54747
bl3: 0.46198
bl4: 0.39026


CBR_00 -----
embedding_sim: 0.
bl2: 0.
bl3: 0.
bl4: 0.


old_CBR_00 -----
embedding_sim: 0.75980
bl2: 0.52887
bl3: 0.44601
bl4: 0.37680


"""

'\nPE -----\nembedding_sim: 0.77055\nembedding_sim_pf: 0.72920\nHuggingFaceEmbeddings: 0.82272\nbl2: 0.54114\nbl3: 0.45684\nbl4: 0.38604\n\nCBR_00 -----\nembedding_sim: 0.76286\nembedding_sim_pf: 0.72389\nHuggingFaceEmbeddings: 0.81547\nbl2: 0.54043\nbl3: 0.45686\nbl4: 0.38614\n\nCBR_00_ing -----\nembedding_sim: 0.76121\nbl2: 0.54747\nbl3: 0.46198\nbl4: 0.39026\n\n\nCBR_00 -----\nembedding_sim: 0.\nbl2: 0.\nbl3: 0.\nbl4: 0.\n\n\nold_CBR_00 -----\nembedding_sim: 0.75980\nbl2: 0.52887\nbl3: 0.44601\nbl4: 0.37680\n\n\n'