diff --git a/users/gaudino/experiments/conformer_att_2023/tedlium2/configs/ted2_recogs.py b/users/gaudino/experiments/conformer_att_2023/tedlium2/configs/ted2_recogs.py index 087c91e60..fafdb4441 100644 --- a/users/gaudino/experiments/conformer_att_2023/tedlium2/configs/ted2_recogs.py +++ b/users/gaudino/experiments/conformer_att_2023/tedlium2/configs/ted2_recogs.py @@ -1259,7 +1259,7 @@ def get_train_data(**kwargs): # "beam_sizes": [32, 70], # }, "model_att_only_currL": { - "scales": [(0.7, 0.3, 0.0, 1.0)], + "scales": [(0.7, 0.3, 0.3, 1.0)], }, # "model_ctc0.3_att0.7_lay6": { # "scales": [(0.8, 0.2, 0.55)], @@ -1302,9 +1302,8 @@ def get_train_data(**kwargs): # joint_training_model_names_2[first_model_name]["beam_sizes"], # joint_training_model_names_2[first_model_name]["scales"], # ): - for beam_size, prior_scale, scales in product( + for beam_size, scales in product( [32], - [0.0, 0.1 ,0.2 ,0.3, 0.4, 0.5, 0.6, 0.7], dict_sep_recombine[first_model_name]["scales"], ): search_args = copy.deepcopy(args) @@ -1317,7 +1316,7 @@ def get_train_data(**kwargs): } search_args["beam_size"] = beam_size search_args["ctc_log_prior_file"] = models["model_ctc_only"]["prior"] - att_scale, ctc_scale,_,_= scales + att_scale, ctc_scale,prior_scale,_= scales label_scale = 1.0 search_args["decoder_args"] = CTCDecoderArgs( @@ -1354,7 +1353,7 @@ def get_train_data(**kwargs): checkpoint=models[first_model_name]["ckpt"], search_args=search_args, bpe_size=BPE_1K, - test_sets=["dev"], + test_sets=["dev", "test"], remove_label={"", ""}, use_sclite=True, time_rqmt=2.0,