# MOS Stability

In [None]:
import sys
sys.path.append("/work/b0990106x/trl/vc")
import importlib
import vc
importlib.reload(vc)
from NISQA.nisqa.NISQA_model import nisqaModel
import numpy as np
import json

In [None]:
def get_reward(output_path, base_path):
    """Score a single audio file with NISQA and return its predicted MOS.

    Args:
        output_path: Path of the audio file to score (handed to NISQA as "deg").
        base_path: Root directory containing the ``NISQA`` folder; the
            pretrained weights and the result directory are resolved under it.

    Returns:
        The first "mos_pred" entry of the prediction as a float, or None when
        prediction (or reading the value) raises.
    """
    batch_size = 1
    worker_count = 0
    nisqa_root = f"{base_path}/NISQA"

    # The "tr_*" entries mirror "bs" / "num_workers", exactly as the model is configured below.
    args_nisqa = {
        "mode": "predict_file",
        "pretrained_model": f"{nisqa_root}/weights/nisqa.tar",
        "deg": output_path,
        "data_dir": None,
        "output_dir": f"{nisqa_root}/result/",
        "csv_file": None,
        "csv_deg": None,
        "num_workers": worker_count,
        "bs": batch_size,
        "ms_channel": None,
        "tr_bs_val": batch_size,
        "tr_num_workers": worker_count,
    }

    # Model construction is deliberately outside the try block: setup errors propagate.
    scorer = nisqaModel(args_nisqa)
    try:
        mos_column = scorer.predict()["mos_pred"]
        reward = float(mos_column.iloc[0])
        print("Reward:", reward)
        return reward
    except Exception as e:
        # Best-effort scoring: report the failure and signal it with None.
        print("Error:", e)
        print("get_reward function end ___________________________")
        return None
    
def calculate_metrics(rewards):
    """Summarise a list of reward scores with basic descriptive statistics.

    Failed runs are reported by ``get_reward`` as None, so None entries are
    dropped before any statistic is computed.

    Args:
        rewards: Iterable of numeric scores; entries may be None.

    Returns:
        dict with the keys "mean", "median", "std_dev", "variance", "min",
        "max", "25th_percentile" and "75th_percentile". Values are plain
        Python floats (so the dict is JSON-serialisable), or None for every
        key when no valid score is available.
    """
    stat_names = (
        "mean",
        "median",
        "std_dev",
        "variance",
        "min",
        "max",
        "25th_percentile",
        "75th_percentile",
    )
    valid_rewards = [r for r in rewards if r is not None]

    # NumPy reductions raise (min/max) or return NaN (mean) on empty input.
    if not valid_rewards:
        return dict.fromkeys(stat_names)

    # float(...) keeps the values JSON-friendly even for integer inputs,
    # where np.min / np.max would otherwise return np.int64.
    metrics = {
        "mean": float(np.mean(valid_rewards)),
        "median": float(np.median(valid_rewards)),
        "std_dev": float(np.std(valid_rewards)),
        "variance": float(np.var(valid_rewards)),
        "min": float(np.min(valid_rewards)),
        "max": float(np.max(valid_rewards)),
        "25th_percentile": float(np.percentile(valid_rewards, 25)),
        "75th_percentile": float(np.percentile(valid_rewards, 75)),
    }
    return metrics

def save_metrics(metrics, path,times, name):
    """Write ``metrics`` as indented JSON to ``{path}/{name}_{times}.json``.

    Args:
        metrics: JSON-serialisable object (typically a dict of statistics).
        path: Directory that receives the file; created if it is missing.
        times: Number of repetitions, used as the file-name suffix.
        name: File-name stem.
    """
    import os  # local import: this notebook section does not import os at cell level

    target = f"{path}/{name}_{times}.json"
    # Create the directory first so results are not lost to a FileNotFoundError
    # after the (expensive) scoring runs have already finished.
    os.makedirs(os.path.dirname(target) or ".", exist_ok=True)
    with open(target, "w") as f:
        json.dump(metrics, f, indent=4)

In [None]:
# base_path = "/work/b0990106x/trl"

# output_path = f"{base_path}/mos_stability"
# audio_name = "example_save_1"
# audio_path= f"{base_path}/mos_stability/{audio_name}.wav"
# times = 10

# scores = []
# for i in range(times):
#     reward = get_reward(audio_path, base_path) # output_path is the audio file path
#     scores.append(reward)

# metrics = calculate_metrics(scores)
# save_metrics(metrics, output_path, times, audio_name) # output_path is where the metrics are saved

# print(metrics)

# VC Model Stability

In [None]:
from dpo_eval import eval_dpo, save_metrics, prepare_data, load_models_and_tokenizers, load_datasets, process_and_get_scores
import torch
import sys
import importlib
import torch
from transformers import BartForConditionalGeneration, AutoTokenizer
import numpy as np
import json
import os

sys.path.append("/work/b0990106x/trl/vc")
import vc
importlib.reload(vc)


In [None]:
# Shared configuration for the VC-model stability experiment.
base_path = "/work/b0990106x/trl"
agent_input_dir = f"{base_path}/data-encodec"

# Checkpoints for the autoregressive (AR) and non-autoregressive (NAR) models.
ar_checkpoint = "lca0503/speech-chatgpt-base-ar-v2-epoch10-wotrans"
nar_checkpoint = "lca0503/speech-chatgpt-base-nar-v2-epoch4-wotrans"

# Run on the GPU when one is visible, otherwise fall back to the CPU.
if torch.cuda.is_available():
    device = "cuda"
else:
    device = "cpu"

# Placeholder value; it is reassigned once the dataset has been loaded.
eval_data_len = 10
# trained_model_name = ts # from model_output
# output_dir_name = ts # output audio

In [None]:
def load_from_json(file_path):
    """Read a JSON list of records and split it into three parallel lists.

    Args:
        file_path: Path to a JSON file holding a list of objects, each with
            the keys "src_encodec", "instruction" and "tgt_encodec".

    Returns:
        Tuple ``(all_src_encodec, all_instruction, all_tgt_encodec)`` of lists,
        one entry per record, in file order.
    """
    with open(file_path, 'r') as handle:
        records = json.load(handle)

    field_names = ("src_encodec", "instruction", "tgt_encodec")
    # One list per field, extracted in the same order as the returned tuple.
    sources, instructions, targets = (
        [record[field] for record in records] for field in field_names
    )
    return sources, instructions, targets

# Load the evaluation records (path is relative to the notebook's working directory).
all_src_encodec, all_instruction, all_tgt_encodec = load_from_json('src_encodec.json')

# Sanity check: print the three list lengths, one per line.
print(len(all_src_encodec), len(all_instruction), len(all_tgt_encodec), sep="\n")

# Number of available evaluation samples.
eval_data_len = len(all_src_encodec)

In [None]:
def calculate_metrics(rewards):
    """Compute descriptive statistics over the non-None entries of ``rewards``.

    Args:
        rewards: List of scores; None marks a failed run and is ignored by
            the statistics.

    Returns:
        dict with "mean", "median", "std_dev", "variance", "min", "max",
        "25th_percentile", "75th_percentile" and "rewards". When at least one
        score is valid, "rewards" is the original list (None entries
        included); when none is valid, every value, "rewards" included, is None.
    """
    # Statistic name -> reducer, in the order the keys appear in the result.
    reducers = {
        "mean": np.mean,
        "median": np.median,
        "std_dev": np.std,
        "variance": np.var,
        "min": np.min,
        "max": np.max,
        "25th_percentile": lambda values: np.percentile(values, 25),
        "75th_percentile": lambda values: np.percentile(values, 75),
    }

    usable = [score for score in rewards if score is not None]
    if not usable:
        # Nothing to summarise: every statistic (and "rewards") is None.
        return {**dict.fromkeys(reducers), "rewards": None}

    summary = {stat: reduce_fn(usable) for stat, reduce_fn in reducers.items()}
    summary["rewards"] = rewards
    return summary


def save_metrics(metrics, path,times, name):
    """Write ``metrics`` as indented JSON to ``{path}/{name}_{times}.json``.

    Note: this definition shadows the ``save_metrics`` imported from
    ``dpo_eval`` earlier in the notebook.

    Args:
        metrics: JSON-serialisable object (typically a dict of statistics).
        path: Directory that receives the file; created if it is missing.
        times: Number of repetitions, used as the file-name suffix.
        name: File-name stem.
    """
    target = f"{path}/{name}_{times}.json"
    # Create the directory first so a missing folder cannot discard the
    # results of a long inference run with a FileNotFoundError.
    os.makedirs(os.path.dirname(target) or ".", exist_ok=True)
    with open(target, "w") as f:
        json.dump(metrics, f, indent=4)

In [None]:
# VC model stability: score the DPO-trained AR model `times` times on each of
# the first `num_src_encodec` (source, instruction) pairs and summarise the scores.
model_name = "0704-1848"
output_dir_name = f"vc_model_stability_{model_name}"

# Per-run output directory under {base_path}/output.
temp = f"{base_path}/output/{output_dir_name}"
os.makedirs(temp, exist_ok=True)

# Directory receiving the metrics JSON. Created up front so the final
# save_metrics call cannot fail after all the inference work is done.
output_path = f"{base_path}/vc_stability"
os.makedirs(output_path, exist_ok=True)

nar_model, ar_tokenizer, nar_tokenizer = load_models_and_tokenizers(ar_checkpoint, nar_checkpoint)
args_predict, test_dataset = load_datasets(base_path, output_dir_name, device)
# NOTE(review): the base checkpoint `model` is not used by the loop below; it is
# still loaded so the name stays defined, but it is no longer moved to `device`.
model = BartForConditionalGeneration.from_pretrained(ar_checkpoint, return_dict=True)
trained_model = BartForConditionalGeneration.from_pretrained(f"{base_path}/model_output/{model_name}/dpo_model")
# The model being scored is `trained_model`, so that is the one that must live on `device`.
trained_model.to(device)

times = 10
num_src_encodec = 10

all_metrics = {}

# Never index past the end of the loaded dataset.
for idx in range(min(num_src_encodec, len(all_src_encodec))):
    src_encodec = all_src_encodec[idx]
    instruction = all_instruction[idx]
    model_reward = []

    for i in range(times):
        try:
            reward = process_and_get_scores(trained_model, nar_model, ar_tokenizer, nar_tokenizer, src_encodec, instruction, args_predict, episode_counter=i)
        except Exception as e:
            # A single failed run is recorded as None (calculate_metrics skips it)
            # instead of aborting the whole sweep.
            print("Error:", e)
            reward = None
        model_reward.append(reward)

    metrics = calculate_metrics(model_reward)
    all_metrics[f"metrics_{idx}"] = metrics

save_metrics(all_metrics, output_path, times, output_dir_name)

In [None]:
# Dump the collected metrics dictionary for a quick visual check.
print(all_metrics)

# Temperature Test 

In [1]:
from dpo_eval import eval_dpo, save_metrics, prepare_data, load_models_and_tokenizers, load_datasets, process_and_get_scores
import torch
import sys
import importlib
import torch
from transformers import BartForConditionalGeneration, AutoTokenizer
import numpy as np
import json
import os

sys.path.append("/work/b0990106x/trl/vc")
import vc
importlib.reload(vc)


  from .autonotebook import tqdm as notebook_tqdm


<module 'vc' (<_frozen_importlib_external._NamespaceLoader object at 0x7f3db5f62560>)>

In [2]:
# Shared configuration for the temperature experiment.
base_path = "/work/b0990106x/trl"
agent_input_dir = f"{base_path}/data-encodec"

# Checkpoints for the autoregressive (AR) and non-autoregressive (NAR) models.
ar_checkpoint = "lca0503/speech-chatgpt-base-ar-v2-epoch10-wotrans"
nar_checkpoint = "lca0503/speech-chatgpt-base-nar-v2-epoch4-wotrans"

# Prefer the GPU when one is visible.
device = "cpu"
if torch.cuda.is_available():
    device = "cuda"

# Placeholder value; it is reassigned once the dataset has been loaded.
eval_data_len = 10

In [3]:
def load_from_json(file_path):
    """Load the evaluation records and return their fields as parallel lists.

    Args:
        file_path: Path to a JSON file containing a list of objects with the
            keys "src_encodec", "instruction" and "tgt_encodec".

    Returns:
        Tuple of three lists: all "src_encodec" values, all "instruction"
        values and all "tgt_encodec" values, in file order.
    """
    with open(file_path, 'r') as json_file:
        entries = json.load(json_file)

    def column(key):
        # Collect one field across every record.
        return [entry[key] for entry in entries]

    return column("src_encodec"), column("instruction"), column("tgt_encodec")

# Load the evaluation records (path is relative to the notebook's working directory).
all_src_encodec, all_instruction, all_tgt_encodec = load_from_json('src_encodec.json')

# Sanity check: print the three list lengths, one per line.
print(len(all_src_encodec), len(all_instruction), len(all_tgt_encodec), sep="\n")

# Number of available evaluation samples.
eval_data_len = len(all_src_encodec)

9254
9254
9254


In [4]:
def calculate_metrics(rewards):
    """Summarise reward scores, ignoring runs that failed (None entries).

    Args:
        rewards: List of scores where None marks a failed run.

    Returns:
        dict with "mean", "median", "std_dev", "variance", "min", "max",
        "25th_percentile", "75th_percentile" and "rewards". With at least one
        valid score, "rewards" holds the original list unchanged; otherwise
        every value in the dict is None.
    """
    scored = [value for value in rewards if value is not None]

    if scored:
        low_quartile = np.percentile(scored, 25)
        high_quartile = np.percentile(scored, 75)
        result = dict(
            mean=np.mean(scored),
            median=np.median(scored),
            std_dev=np.std(scored),
            variance=np.var(scored),
            min=np.min(scored),
            max=np.max(scored),
        )
        # These keys start with a digit, so they cannot be passed as keyword arguments.
        result["25th_percentile"] = low_quartile
        result["75th_percentile"] = high_quartile
        result["rewards"] = rewards
        return result

    # No valid score at all: report every field as None.
    field_names = (
        "mean",
        "median",
        "std_dev",
        "variance",
        "min",
        "max",
        "25th_percentile",
        "75th_percentile",
        "rewards",
    )
    return {field: None for field in field_names}


def save_metrics(metrics, path,times, name):
    """Write ``metrics`` as indented JSON to ``{path}/{name}_{times}.json``.

    Note: this definition shadows the ``save_metrics`` imported from
    ``dpo_eval`` earlier in the notebook.

    Args:
        metrics: JSON-serialisable object (typically a dict of statistics).
        path: Directory that receives the file; created if it is missing.
        times: Number of repetitions, used as the file-name suffix.
        name: File-name stem.
    """
    target = f"{path}/{name}_{times}.json"
    # Create the directory first so a missing folder cannot discard the
    # results of a long inference run with a FileNotFoundError.
    os.makedirs(os.path.dirname(target) or ".", exist_ok=True)
    with open(target, "w") as f:
        json.dump(metrics, f, indent=4)

In [5]:
# Temperature test: for one fixed (source, instruction) pair, run inference
# `times` times at each sampling temperature and summarise the scores.
model_name = "original_model_2"
output_dir_name = f"temp_test_{model_name}"

# Per-run output directory under {base_path}/output (generated audio is written here).
temp = f"{base_path}/output/{output_dir_name}"
os.makedirs(temp, exist_ok=True)

# Directory receiving the metrics JSON. Created up front so the final
# save_metrics call cannot fail after all the inference work is done.
output_path = f"{base_path}/temp_test"
os.makedirs(output_path, exist_ok=True)

nar_model, ar_tokenizer, nar_tokenizer = load_models_and_tokenizers(ar_checkpoint, nar_checkpoint)
args_predict, test_dataset = load_datasets(base_path, output_dir_name, device)
ar_model = BartForConditionalGeneration.from_pretrained(ar_checkpoint, return_dict=True)
# trained_model = BartForConditionalGeneration.from_pretrained(f"{base_path}/model_output/{model_name}/dpo_model")
# Moving the model is loop-invariant, so do it once.
ar_model.to(device)

times = 10
num_src_encodec = 10

all_metrics = {}
# 1. Select one src_encodec and instruction, then run inference `times` times
#    at a given temperature to get `times` scores.
# 2. Repeat for every temperature from 0.1 to 2.0 in steps of 0.1.

temperature_list = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0, 1.1, 1.2, 1.3, 1.4, 1.5, 1.6, 1.7, 1.8, 1.9, 2.0]


src_encodec = all_src_encodec[0]
instruction = all_instruction[0]

for temperature in temperature_list:
    model_reward = []
    print(f"Temperature: {temperature}")
    for i in range(times):
        try:
            # NOTE(review): episode_counter is fixed at 0, so every run overwrites
            # the same example_save_0.wav; confirm that only the score is needed.
            reward = process_and_get_scores(ar_model, nar_model, ar_tokenizer, nar_tokenizer, src_encodec, instruction, args_predict, episode_counter=0, temperature = temperature)
            model_reward.append(reward)
        except Exception as e:
            # A failed run is recorded as None; calculate_metrics skips it.
            print("Error:", e)
            model_reward.append(None)

    metrics = calculate_metrics(model_reward)
    all_metrics[f"temperature_{temperature}"] = metrics

save_metrics(all_metrics, output_path, times, output_dir_name)


# for idx in range(num_src_encodec):
#     src_encodec = all_src_encodec[idx]
#     instruction = all_instruction[idx]
#     model.to(device)
#     model_reward = []

#     for i in range(times):
#         reward = process_and_get_scores(ar_model, nar_model, ar_tokenizer, nar_tokenizer, src_encodec, instruction, args_predict, episode_counter=i)
#         model_reward.append(reward)

#     metrics = calculate_metrics(model_reward)
#     all_metrics[f"metrics_{idx}"] = metrics

# save_metrics(all_metrics, output_path, times, output_dir_name)



Temperature: 0.1




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4189093112945557




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4081318378448486




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2945311069488525




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2543447017669678




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.364048719406128




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2224106788635254




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.375168561935425




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3483996391296387




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.271650552749634




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1888418197631836
Temperature: 0.2




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1378731727600098




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1730329990386963




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.195197105407715




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2648892402648926




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2351834774017334




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1653850078582764




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1536543369293213




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.282884120941162




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3567607402801514




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.360053300857544
Temperature: 0.3




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3447351455688477




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.514394998550415




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0780792236328125




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2305843830108643




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.121185302734375




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3348968029022217




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2803900241851807




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.427555799484253




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2001752853393555




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2979698181152344
Temperature: 0.4




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3041834831237793




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3272008895874023




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3799989223480225




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3288328647613525




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3991591930389404




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.421257495880127




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3224260807037354




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2291319370269775




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.375209331512451




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3929169178009033
Temperature: 0.5




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.331385612487793




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3906242847442627




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2645761966705322




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.546340227127075




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1386609077453613




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.242288589477539




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3007872104644775




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2137372493743896




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.258363962173462




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.212693691253662
Temperature: 0.6




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1721720695495605




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.330202341079712




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0179083347320557




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.267575263977051




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4886105060577393




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.436802625656128




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4419400691986084




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.259446859359741




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4902846813201904




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4387857913970947
Temperature: 0.7




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.39819073677063




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.503331422805786




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4210987091064453




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.304758310317993




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3924355506896973




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.294095754623413




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.516859292984009




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3270785808563232




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3534252643585205




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.345350503921509
Temperature: 0.8




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.510524034500122




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 1.9777336120605469




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2629201412200928




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.280031204223633




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1928770542144775




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2487332820892334




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.298637628555298




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4043052196502686




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.213909387588501




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2499899864196777
Temperature: 0.9




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2107107639312744




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3049614429473877




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4112603664398193




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2771637439727783




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3096485137939453




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3831374645233154




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3060643672943115




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.351259469985962




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.200662612915039




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.380018949508667
Temperature: 1.0




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.434725046157837




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3713972568511963




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.280567169189453




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.5487864017486572




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.5317091941833496




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2998311519622803




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2801802158355713




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2792763710021973




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2171359062194824




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1110377311706543
Temperature: 1.1




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.195152997970581




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2680394649505615




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.244067907333374




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.269214153289795




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4398019313812256




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.376267433166504




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.301903486251831




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3494620323181152




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2005393505096436




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1589624881744385
Temperature: 1.2




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0946662425994873




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.354818105697632




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2720491886138916




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3348515033721924




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.211221218109131




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.372511386871338




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2183921337127686




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.370466470718384




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.670482873916626




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.313345432281494
Temperature: 1.3




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2629899978637695




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2579972743988037




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.199958086013794




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4183924198150635




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.381101369857788




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.157278299331665




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.368967294692993




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4284467697143555




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.184138298034668




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4391677379608154
Temperature: 1.4




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.182769775390625




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.225294828414917




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.246568441390991




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3640410900115967




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1483724117279053




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.224385976791382




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3980765342712402




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2121169567108154




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2769105434417725




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2315690517425537
Temperature: 1.5




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1635525226593018




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1783177852630615




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.329116106033325




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.397200345993042




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.019183397293091




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0861575603485107




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1561169624328613




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3535757064819336




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0645852088928223




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2508606910705566
Temperature: 1.6




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2938055992126465




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.265484571456909




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.200223445892334




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 1.9949201345443726




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2365384101867676




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1572163105010986




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.126356840133667




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.209202527999878




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2439346313476562




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.136709213256836
Temperature: 1.7




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2482306957244873




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2390968799591064




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.303368330001831




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1320362091064453




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2150158882141113




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2445576190948486




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.345210075378418




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1744682788848877




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3647449016571045




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.144303798675537
Temperature: 1.8




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3159515857696533




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3111233711242676




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.24902081489563




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1718952655792236




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2431137561798096




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.203310966491699




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4889109134674072




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.235412359237671




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0748987197875977




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 1.982914686203003
Temperature: 1.9




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1574695110321045




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0907249450683594




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.4017984867095947




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.192504644393921




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3253228664398193




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.153745412826538




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2800753116607666




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.116288423538208




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 1.9566060304641724




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.210458517074585
Temperature: 2.0




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1020474433898926




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2153642177581787




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2908475399017334




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.26238751411438




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.1061980724334717




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.196073293685913




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.2196907997131348




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3887152671813965




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.0964345932006836




Episode 0 : audio saved to  /work/b0990106x/trl/output/temp_test_original_model_2/example_save_0.wav


  mel_basis = filters.mel(sr=sr, n_fft=n_fft, **kwargs)


Reward: 2.3229873180389404
