### 1. Settings

In [1]:
#####################################
##########  DEPENDENCIES ###########
#####################################

import os
import pickle
from tqdm import tqdm # type: ignore
from datetime import date

import evaluate

from transformers import AutoModelForSeq2SeqLM, AutoTokenizer

import utils.prep as pr
import utils.eval as ev
import utils.inference as infer
from utils.sampling import create_splits, prep_cv_validation
from utils.training import cv_cluster_set, cv_training_epochs_sets
from utils.training import results_dict_todf, cv_step_2, full_step_2

# Enable tqdm's pandas integration for progress bars on DataFrame operations.
tqdm.pandas()

# Silence every Python warning for the rest of the session.
import warnings
warnings.filterwarnings("ignore")

# Process-wide switches, set in a single call:
#   TOKENIZERS_PARALLELISM - turn off the tokenizers library's own parallelism
#   WANDB_DISABLED         - keep the trainer from reporting to Weights & Biases
#   CUDA_VISIBLE_DEVICES   - expose only GPU 0 to this process
os.environ.update(
    {
        "TOKENIZERS_PARALLELISM": "false",
        "WANDB_DISABLED": "true",
        "CUDA_VISIBLE_DEVICES": "0",
    }
)

import torch
#####################################
############  CONSTANTS #############
#####################################
RS = 42  # seed; experiment_config carries the same value under "RS"

MODEL = "CodeT5"
BATCH_SIZE = 16
DECODER_LENGTH = 20
ENCODER_LENGTH = 30

# Date suffix used in every artefact file name written/read by this notebook.
# It defaults to today's date (the previous behaviour). Pickles are saved in
# one session and reloaded in a later one, so the ANALYSIS_DATE environment
# variable lets a later session pin the date of the run it wants to reload
# (format: YYYY-MM-DD, i.e. what str(date.today()) produced at save time).
ANALYSIS_DATE = os.environ.get("ANALYSIS_DATE", str(date.today()))
ANALYSIS_POSTFIX = f"mined_no_drift_{ANALYSIS_DATE}"

# NOTE(review): this is an int, while experiment_config["DATE_STR"] is the
# string "20240721" - confirm which type downstream helpers expect.
DATE_STR = 20240721
# NOTE(review): the flag says drift is enabled but ANALYSIS_POSTFIX says
# "no_drift" - confirm which one reflects this experiment.
SEMANTIC_DRIFT = True
model_name="Salesforce/codet5-base-multi-sum"

# Settings handed to the training helpers via experiment_config["FULL_TRAIN_ARGS"].
FULL_TRAIN_ARGS = {
    "BATCH_SIZE": BATCH_SIZE,
    "DECODER_LENGTH": DECODER_LENGTH,
    "ENCODER_LENGTH": ENCODER_LENGTH,
    "MODEL": MODEL,
    "SEQ_TRAINER_ARGS": {
        "overwrite_output_dir": True,
        # Cumulative epoch milestones, not a single epoch count: the training
        # log shows each set trained as the delta to the previous milestone
        # (e.g. set 5 runs 4 more epochs on top of set 1).
        "num_train_epochs": [0, 1, 5, 8, 10, 16],
        "do_train": True,
        "do_eval": True,
        "per_device_train_batch_size": 4,
        "per_device_eval_batch_size": 4,
        "learning_rate": 6e-6,
        "warmup_steps": 500,
        "weight_decay": 0.1,
        "label_smoothing_factor": 0.1,
        "predict_with_generate": True,
        "logging_steps": 100,
        "save_total_limit": 1,
        "save_strategy": "no",
        "logging_strategy": "epoch",
        "evaluation_strategy": "epoch",
        "load_best_model_at_end": False,
        "output_dir" : 'reports/results',
        "logging_dir" : "reports/logs",
    },
}

# `skip_special_tokens` is an argument of tokenizer.decode()/batch_decode(),
# not of from_pretrained(), so it is no longer passed here.
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForSeq2SeqLM.from_pretrained(model_name)
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
rouge = evaluate.load('rouge')

[nltk_data] Downloading package punkt to
[nltk_data]     /home/RDC/zinovyee.hub/nltk_data...
[nltk_data]   Package punkt is already up-to-date!


### 2. CoNaLa data: preprocessing

In [2]:
# Single configuration object passed to every sampling/training helper.
# DATE_STR and RS are derived from the constants in the settings cell instead
# of being re-typed here, so the two places cannot drift apart. The resulting
# values are unchanged: "20240721" (string) and 42.
experiment_config = {
    "DATE_STR" : str(DATE_STR),
    "RS" : RS,
    "DRIFT_TYPE" : "sudden",
    "NFOLD" : 3,
    "FULL_TRAIN_ARGS" : FULL_TRAIN_ARGS,
    "MODEL_NAME" : model_name,
    "ANALYSIS_POSTFIX" : ANALYSIS_POSTFIX,
    "CLUSTER_EPOCHS" : 1,
}

In [3]:
# Build the train/test split; the helper returns a dict from which the
# training dataset, the test dataset and the test DataFrame are taken.
sampling_dict = create_splits(
    tokenizer=tokenizer,
    experiment_config=experiment_config,
    test=False,
)
train_dataset = sampling_dict["train_data"]
test_data = sampling_dict["test_data"]
test_df = sampling_dict["test_df"]

# Derive the cross-validation folds and the accompanying question list
# from the training portion only.
splits, questions_list = prep_cv_validation(
    experiment_config=experiment_config,
    train_dataset=train_dataset,
)

Train Data:  (7942, 11)
Test Data:  (2058, 11)
Train Data: Cluster cluster
2    3632
3    2204
1    1672
0     414
4      20
Name: count, dtype: int64
Test Data: Cluster cluster
4    1980
3      39
2      25
1      12
0       2
Name: count, dtype: int64


Filter:   0%|          | 0/2058 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2058 [00:00<?, ? examples/s]

Map:   0%|          | 0/2058 [00:00<?, ? examples/s]

Fold 0
Fold 1
Fold 2


In [5]:
# Cross-validated fine-tuning over every epoch milestone configured in
# FULL_TRAIN_ARGS; the per-fold outcomes are gathered in `fold_results`.
fold_results = cv_training_epochs_sets(
    train_dataset=train_dataset,
    splits=splits,
    questions_list=questions_list,
    tokenizer=tokenizer,
    experiment_config=experiment_config,
)

Fold 0


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5298 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5298 [00:00<?, ? examples/s]

Map:   0%|          | 0/5298 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Map:   0%|          | 0/2644 [00:00<?, ? examples/s]

TRAINING EPOCH SET 0
TRAINING EPOCHS 0
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


TRAINING EPOCH SET 1
TRAINING EPOCHS 1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,5.1817,4.698771,0.2487,0.0616,0.2212,0.2213,14.1649,0.0215,1.0,1.1625,29444,25328


TRAINING EPOCH SET 5
TRAINING EPOCHS 4
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,4.6798,4.561677,0.2599,0.0666,0.2298,0.2299,14.1528,0.0207,1.0,1.1572,29309,25328
2,4.5816,4.505205,0.265,0.0697,0.2336,0.2335,14.0564,0.0225,1.0,1.1441,28979,25328
3,4.4846,4.484755,0.2674,0.0715,0.2352,0.2352,14.0061,0.0233,1.0,1.1344,28732,25328
4,4.4337,4.477675,0.2687,0.0728,0.2366,0.2367,14.09,0.0243,1.0,1.1442,28981,25328


TRAINING EPOCH SET 8
TRAINING EPOCHS 3
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,4.2429,4.479573,0.2658,0.0693,0.2327,0.2327,14.1483,0.0232,1.0,1.1477,29068,25328
2,4.2185,4.470181,0.2703,0.0724,0.2367,0.2366,14.0344,0.0233,1.0,1.1356,28762,25328
3,4.2043,4.4659,0.2692,0.0716,0.2354,0.2353,14.166,0.0227,1.0,1.1473,29058,25328


TRAINING EPOCH SET 10
TRAINING EPOCHS 2
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,3.9388,4.5065,0.2631,0.0672,0.2311,0.2311,14.0692,0.0224,1.0,1.136,28773,25328
2,3.9584,4.50456,0.2677,0.0696,0.234,0.2339,13.9391,0.0229,1.0,1.1237,28461,25328


TRAINING EPOCH SET 16
TRAINING EPOCHS 6
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,3.6751,4.572701,0.2582,0.0665,0.2271,0.2272,13.9482,0.0206,1.0,1.1203,28375,25328
2,3.798,4.518637,0.2659,0.0688,0.2329,0.2328,13.9939,0.0218,1.0,1.128,28571,25328
3,3.954,4.4866,0.2683,0.0709,0.235,0.2351,13.9346,0.0223,1.0,1.121,28393,25328
4,3.9976,4.47,0.2661,0.0709,0.2331,0.2333,13.924,0.0224,1.0,1.1203,28375,25328
5,3.9793,4.47636,0.2667,0.0701,0.2336,0.2337,14.0004,0.0216,1.0,1.1258,28514,25328
6,3.9533,4.479221,0.2654,0.069,0.2321,0.2323,13.9875,0.021,1.0,1.1269,28543,25328


Fold 1


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5295 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5295 [00:00<?, ? examples/s]

Map:   0%|          | 0/5295 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Map:   0%|          | 0/2647 [00:00<?, ? examples/s]

TRAINING EPOCH SET 0
TRAINING EPOCHS 0
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


TRAINING EPOCH SET 1
TRAINING EPOCHS 1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,5.1708,4.710202,0.2492,0.061,0.2217,0.2219,14.0385,0.0195,1.0,1.1426,29242,25592


TRAINING EPOCH SET 5
TRAINING EPOCHS 4
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,4.6706,4.571948,0.2701,0.0716,0.2375,0.2374,14.0831,0.0246,1.0,1.1401,29178,25592
2,4.571,4.509912,0.2721,0.0733,0.2382,0.2383,13.9698,0.0262,1.0,1.1286,28884,25592
3,4.4792,4.48725,0.2734,0.0733,0.2394,0.2394,14.1073,0.0253,1.0,1.138,29124,25592
4,4.4222,4.483542,0.2755,0.0734,0.2405,0.2407,14.071,0.0256,1.0,1.1332,29000,25592


TRAINING EPOCH SET 8
TRAINING EPOCHS 3
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,4.2315,4.491459,0.2759,0.0734,0.2404,0.2406,14.1711,0.0264,1.0,1.1404,29184,25592
2,4.2073,4.473559,0.2752,0.0727,0.2402,0.24,14.0608,0.0266,1.0,1.1286,28884,25592
3,4.1976,4.472107,0.2762,0.0726,0.2411,0.2411,14.0257,0.026,1.0,1.1232,28746,25592


TRAINING EPOCH SET 10
TRAINING EPOCHS 2
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,3.9242,4.526834,0.2709,0.0697,0.2367,0.2368,14.1572,0.0244,1.0,1.1351,29050,25592
2,3.9467,4.513162,0.2711,0.0693,0.2369,0.2369,13.9868,0.0241,1.0,1.1177,28603,25592


TRAINING EPOCH SET 16
TRAINING EPOCHS 6
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,3.6578,4.604552,0.2663,0.0667,0.232,0.232,14.1099,0.0224,1.0,1.1322,28975,25592
2,3.7852,4.518794,0.27,0.0692,0.2359,0.236,14.0903,0.0243,1.0,1.1323,28977,25592
3,3.9451,4.487727,0.2686,0.0697,0.2361,0.236,14.034,0.0254,1.0,1.1219,28711,25592
4,3.9782,4.487778,0.2709,0.0695,0.2365,0.2366,14.1564,0.0245,1.0,1.1368,29094,25592
5,3.9615,4.488613,0.2699,0.0701,0.2366,0.2367,14.1012,0.0247,1.0,1.1263,28825,25592
6,3.9338,4.492178,0.2697,0.0701,0.2361,0.2363,14.1371,0.0248,1.0,1.1316,28961,25592


Fold 2


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Map:   0%|          | 0/5291 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Map:   0%|          | 0/2651 [00:00<?, ? examples/s]

TRAINING EPOCH SET 0
TRAINING EPOCHS 0
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


TRAINING EPOCH SET 1
TRAINING EPOCHS 1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,5.18,4.713183,0.2403,0.0617,0.2159,0.216,14.017,0.0202,1.0,1.1579,29271,25280


TRAINING EPOCH SET 5
TRAINING EPOCHS 4
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,4.6788,4.577013,0.2608,0.0722,0.232,0.232,14.0219,0.0245,1.0,1.1485,29033,25280
2,4.5745,4.520506,0.2694,0.0738,0.238,0.2381,13.9415,0.0249,1.0,1.1382,28773,25280
3,4.4696,4.501167,0.2737,0.0753,0.2418,0.2417,14.143,0.0252,1.0,1.1571,29252,25280
4,4.4227,4.495306,0.2736,0.0751,0.2413,0.2414,14.0932,0.0245,1.0,1.1517,29114,25280


TRAINING EPOCH SET 8
TRAINING EPOCHS 3
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,4.2411,4.499412,0.2682,0.0735,0.2372,0.2372,14.0034,0.0238,1.0,1.1372,28748,25280
2,4.2089,4.486858,0.271,0.0739,0.2392,0.2392,13.9694,0.0247,1.0,1.1362,28722,25280
3,4.1886,4.485295,0.2703,0.074,0.2382,0.2383,14.0645,0.0245,1.0,1.1451,28949,25280


TRAINING EPOCH SET 10
TRAINING EPOCHS 2
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,3.9371,4.532994,0.2643,0.0704,0.2328,0.233,13.9842,0.0238,1.0,1.1303,28574,25280
2,3.9495,4.521092,0.2667,0.0705,0.2343,0.2346,13.9608,0.0235,1.0,1.1312,28596,25280


TRAINING EPOCH SET 16
TRAINING EPOCHS 6
LOADING MODEL ./tmp/
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,3.6765,4.609656,0.2598,0.0682,0.2283,0.2286,13.9834,0.023,1.0,1.1252,28446,25280
2,3.79,4.533356,0.2671,0.0718,0.2344,0.2345,13.7842,0.0244,1.0,1.1131,28140,25280
3,3.9354,4.508908,0.2696,0.0724,0.2365,0.2366,14.0634,0.025,1.0,1.1408,28840,25280
4,3.9802,4.49993,0.2669,0.0714,0.235,0.2351,13.9694,0.0243,1.0,1.1322,28621,25280
5,3.964,4.499954,0.2673,0.0715,0.2345,0.2345,14.1203,0.0245,1.0,1.1453,28953,25280
6,3.9399,4.503712,0.2669,0.0715,0.2342,0.2342,14.0415,0.0248,1.0,1.1388,28789,25280


In [11]:
# Add one cluster-specific model set per cluster id to the CV results.
# `fold_results` is threaded through each call and afterwards also holds
# the "cluster_<id>" entries next to the epoch sets.
for cluster_idx in [1, 4, 3]:
    fold_results = cv_cluster_set(experiment_config=experiment_config,
                                    splits=splits,
                                    questions_list=questions_list,
                                    train_dataset=train_dataset,
                                    tokenizer=tokenizer,
                                    fold_results=fold_results,
                                    cluster_id=cluster_idx)

# Flatten the nested results into one DataFrame for analysis.
cv_df = results_dict_todf(fold_results)

########## SAVE THE FILE

# Create the target directory first: this write happens after hours of
# training, so a missing folder must not cost us the results.
os.makedirs('reports/results', exist_ok=True)
with open(f'reports/results/cv_result_{ANALYSIS_POSTFIX}.pickle', 'wb') as handle:
    pickle.dump(cv_df, handle, protocol=pickle.HIGHEST_PROTOCOL)

Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Map:   0%|          | 0/5291 [00:00<?, ? examples/s]

Fold 0


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Map:   0%|          | 0/2644 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 1 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,5.1146,4.729678,0.2347,0.0545,0.2096,0.2097,13.2349,0.0193,1.0,1.0765,27266,25328


Fold 1


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Map:   0%|          | 0/2647 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 1 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Fold 2


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Map:   0%|          | 0/2651 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 1 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Map:   0%|          | 0/5291 [00:00<?, ? examples/s]

Fold 0


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Map:   0%|          | 0/2644 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 4 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,5.0557,4.754361,0.2208,0.0498,0.1961,0.1962,12.5291,0.0173,1.0,1.0224,25895,25328


Fold 1


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Map:   0%|          | 0/2647 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 4 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Fold 2


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Map:   0%|          | 0/2651 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 4 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Filter:   0%|          | 0/5291 [00:00<?, ? examples/s]

Map:   0%|          | 0/5291 [00:00<?, ? examples/s]

Fold 0


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2644 [00:00<?, ? examples/s]

Map:   0%|          | 0/2644 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 3 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Epoch,Training Loss,Validation Loss,Rouge1,Rouge2,Rougel,Rougelsum,Gen Len,Bleu,Brevity Penalty,Length Ratio,Translation Length,Reference Length
1,5.109,4.724148,0.2268,0.0532,0.2,0.2002,13.2281,0.0171,1.0,1.0872,27537,25328


Fold 1


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2647 [00:00<?, ? examples/s]

Map:   0%|          | 0/2647 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 3 FOR EPOCHS1
LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


Fold 2


Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/7942 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Filter:   0%|          | 0/2651 [00:00<?, ? examples/s]

Map:   0%|          | 0/2651 [00:00<?, ? examples/s]

TRAINING CLUSTER SET 3 FOR EPOCHS1


Using the `WANDB_DISABLED` environment variable is deprecated and will be removed in v5. Use the --report_to flag to control the integrations used for logging result (for instance --report_to none).


LOADING MODEL Salesforce/codet5-base-multi-sum
cuda


In [12]:
# Sanity check: list the model sets collected so far (epoch milestones plus
# the "cluster_<id>" entries added by the cluster loop).
fold_results.keys()

dict_keys([0, 1, 5, 8, 10, 16, 'cluster_1', 'cluster_4', 'cluster_3'])

In [13]:
# ROUGE summary per model set, computed over the rows of cv_df.
rouge_by_model_set = cv_df.groupby("model_set")["rouge"]

print("Mean")
print(rouge_by_model_set.mean())

print("STD")
print(rouge_by_model_set.std())

Mean
model_set
0            0.113737
1            0.247452
5            0.273484
8            0.273170
10           0.270033
16           0.268677
cluster_1    0.154332
cluster_3    0.151154
cluster_4    0.149859
Name: rouge, dtype: float64
STD
model_set
0            0.124526
1            0.157347
5            0.158682
8            0.158973
10           0.158828
16           0.158742
cluster_1    0.148038
cluster_3    0.146543
cluster_4    0.145705
Name: rouge, dtype: float64


In [6]:
########## LOAD CV RESULTS

# `pickle` is imported once in the settings cell, so it is not re-imported here.
# NOTE: ANALYSIS_POSTFIX contains a date, so it has to resolve to the same
# value as in the session that wrote this file.
# NOTE: pickle.load can execute arbitrary code; only load files produced by
# this notebook.
with open(f'reports/results/cv_result_{ANALYSIS_POSTFIX}.pickle', 'rb') as handle:
    cv_df = pickle.load(handle)

### Step 2. Learn performance

In [None]:
# Run step 2 on the CV frame. The helper returns the updated frame together
# with the per-model results (presumably the fitted second-stage models such
# as lr/svm named in the log - see utils.training.cv_step_2).
cv_df, model_results = cv_step_2(
    cv_df=cv_df,
    experiment_config=experiment_config,
)

# Persist both outputs so that later cells can resume from disk.
with open(f'reports/results/s2_model_results_{ANALYSIS_POSTFIX}.pickle', 'wb') as handle:
    pickle.dump(model_results, handle, protocol=pickle.HIGHEST_PROTOCOL)

with open(f'reports/results/cd_df_with_s2_{ANALYSIS_POSTFIX}.pickle', 'wb') as handle:
    pickle.dump(cv_df, handle, protocol=pickle.HIGHEST_PROTOCOL)

# ROUGE summary per model set after step 2.
rouge_by_model_set = cv_df.groupby("model_set")["rouge"]

print("Mean")
print(rouge_by_model_set.mean())

print("STD")
print(rouge_by_model_set.std())

0
lr
svm


In [4]:
### RELOAD THE CV FRAME WITH STEP 2 RESULTS
# Input for full_step_2 in the next cell (presumably where the vectorizer
# and the step 2 models get saved - confirm in utils.training).

s2_cv_path = f'reports/results/cd_df_with_s2_{ANALYSIS_POSTFIX}.pickle'
with open(s2_cv_path, 'rb') as handle:
    cv_df = pickle.load(handle)

In [5]:
# Run step 2 on the complete CV frame (the log lists lr, svm, lgbm and
# catboost being processed in turn).
full_step_2(
    experiment_config=experiment_config,
    cv_df=cv_df,
)

lr
svm
lgbm
[LightGBM] [Info] Auto-choosing row-wise multi-threading, the overhead of testing was 4.989763 seconds.
You can set `force_row_wise=true` to remove the overhead.
And if memory is not enough, you can set `force_col_wise=true`.
[LightGBM] [Info] Total Bins 21187
[LightGBM] [Info] Number of data points in the train set: 71478, number of used features: 1422
[LightGBM] [Info] Start training from score 0.211322
catboost
Learning rate set to 0.080378
0:	learn: 0.1619674	total: 68.3ms	remaining: 1m 8s
1:	learn: 0.1603686	total: 82.6ms	remaining: 41.2s
2:	learn: 0.1590035	total: 94.8ms	remaining: 31.5s
3:	learn: 0.1578352	total: 106ms	remaining: 26.4s
4:	learn: 0.1568431	total: 116ms	remaining: 23.1s
5:	learn: 0.1559708	total: 127ms	remaining: 21s
6:	learn: 0.1552563	total: 137ms	remaining: 19.5s
7:	learn: 0.1545913	total: 148ms	remaining: 18.4s
8:	learn: 0.1540291	total: 159ms	remaining: 17.5s
9:	learn: 0.1535557	total: 170ms	remaining: 16.8s
10:	learn: 0.1531613	total: 180ms	remai