In [1]:
import os

from trainer import Trainer, TrainerArgs

from TTS.config.shared_configs import BaseAudioConfig
from TTS.tts.configs.glow_tts_config import GlowTTSConfig
from TTS.tts.configs.shared_configs import BaseDatasetConfig
from TTS.tts.datasets import load_tts_samples
from TTS.tts.models.glow_tts import GlowTTS
from TTS.tts.utils.speakers import SpeakerManager
from TTS.tts.utils.text.tokenizer import TTSTokenizer
from TTS.utils.audio import AudioProcessor



In [2]:
# Filesystem locations for the corpus and for everything the run writes.
# Raw strings are used so that backslashes in the Windows paths are never
# interpreted as escape sequences (e.g. "\t" or "\n" in a folder name).
dataset_path = r"D:\data\TIMIT\TRAIN"  # root folder of the training audio/text
output_path = r"D:\data\TIMIT"  # run folders, checkpoints and caches go here

In [3]:
# Dataset configuration.
# The "vctk_old" format is required when the corpus provides wav files
# rather than flac files.
dataset_config = BaseDatasetConfig(
    name="vctk_old",
    meta_file_train="",
    language="en-us",
    path=dataset_path,
)

In [4]:
# Audio configuration: sampling, pre-emphasis and silence-trimming settings
# that are handed to the audio processor.
audio_config = BaseAudioConfig(
    sample_rate=22050,
    resample=True,
    preemphasis=0.98,
    power=1.2,
    ref_level_db=2,
    do_trim_silence=False,
    trim_db=23.0,
)

In [6]:
# Model / training configuration for GlowTTS.
#
# `audio=audio_config` attaches the custom audio settings to the model config so
# that the configuration stored with the run describes the same audio processing
# the AudioProcessor applies during training. Without it, the model config keeps
# its default audio section while features are extracted with `audio_config`.
config = GlowTTSConfig(
    # --- audio ---
    audio=audio_config,
    # --- batching / data loading (0 workers: load in the main process) ---
    batch_size=64,
    eval_batch_size=16,
    num_loader_workers=0,
    num_eval_loader_workers=0,
    precompute_num_workers=0,
    # --- schedule ---
    run_eval=True,
    test_delay_epochs=-1,
    epochs=1000,
    # --- text processing ---
    text_cleaner="phoneme_cleaners",
    use_phonemes=True,
    phoneme_language="en-us",
    phoneme_cache_path=os.path.join(output_path, "phoneme_cache"),
    # --- logging ---
    print_step=25,
    print_eval=False,
    # --- training setup ---
    mixed_precision=True,
    output_path=output_path,
    datasets=[dataset_config],
    use_speaker_embedding=True,
    # --- sample length filters (text length and audio length bounds) ---
    min_text_len=0,
    max_text_len=500,
    min_audio_len=0,
    max_audio_len=500000,
)

In [7]:
# INITIALIZE THE AUDIO PROCESSOR
# The audio processor is used for feature extraction and audio I/O.
# It mainly serves the dataloader and the training loggers.
# It is built directly from `audio_config` (the standalone audio settings).
ap = AudioProcessor.init_from_config(audio_config)

 > Setting up Audio Processor...
 | > sample_rate:22050
 | > resample:True
 | > num_mels:80
 | > log_func:np.log10
 | > min_level_db:-100
 | > frame_shift_ms:None
 | > frame_length_ms:None
 | > ref_level_db:2
 | > fft_size:1024
 | > power:1.2
 | > preemphasis:0.98
 | > griffin_lim_iters:60
 | > signal_norm:True
 | > symmetric_norm:True
 | > mel_fmin:0
 | > mel_fmax:None
 | > pitch_fmin:0.0
 | > pitch_fmax:640.0
 | > spec_gain:20.0
 | > stft_pad_mode:reflect
 | > max_norm:4.0
 | > clip_norm:True
 | > do_trim_silence:False
 | > trim_db:23.0
 | > do_sound_norm:False
 | > do_amp_to_db_linear:True
 | > do_amp_to_db_mel:True
 | > do_rms_norm:False
 | > db_level:None
 | > stats_path:None
 | > base:10
 | > hop_length:256
 | > win_length:1024


In [8]:
# INITIALIZE THE TOKENIZER
# The tokenizer converts text into sequences of token IDs.
# If characters are not defined in the config, default characters are passed to the config;
# `config` is rebound here to the config object returned alongside the tokenizer.
tokenizer, config = TTSTokenizer.init_from_config(config)

In [9]:
# LOAD DATA SAMPLES
# Read the dataset described by `dataset_config` and split it into a training
# set and an evaluation set. The split sizing is taken from the model config.
eval_split_options = {
    "eval_split": True,
    "eval_split_max_size": config.eval_split_max_size,
    "eval_split_size": config.eval_split_size,
}
train_samples, eval_samples = load_tts_samples(dataset_config, **eval_split_options)

 | > Found 140 files in D:\data\TIMIT\TRAIN


In [10]:
# Multi-speaker setup: gather speaker IDs from every sample (train and eval),
# then record the resulting number of speakers on the model config.
all_samples = train_samples + eval_samples

speaker_manager = SpeakerManager()
speaker_manager.set_ids_from_data(all_samples, parse_key="speaker_name")
config.num_speakers = speaker_manager.num_speakers

In [11]:
# Build the GlowTTS model from the config, the audio processor and the tokenizer;
# the speaker manager is supplied for multi-speaker training.
model = GlowTTS(config, ap, tokenizer, speaker_manager=speaker_manager)

 > Init speaker_embedding layer.


In [12]:
# INITIALIZE THE TRAINER
# The trainer receives default trainer arguments, the model config, the output
# folder, the model itself and the train/eval sample sets.
trainer_args = TrainerArgs()

trainer = Trainer(
    trainer_args,
    config,
    output_path,
    model=model,
    train_samples=train_samples,
    eval_samples=eval_samples,
)

 > Using CUDA: True
 > Number of GPUs: 1

 > Model has 32336209 parameters


 > `speakers.pth` is saved to D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\speakers.pth.
 > `speakers_file` is updated in the config.json.


In [13]:
# Start training with the trainer configured above (long-running; logs are printed below).
trainer.fit()


[4m[1m > EPOCH: 0/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:29:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 0[0m
     | > current_lr: 0.00000 
     | > step_time: 1.56420  (1.56416)
     | > loader_time: 0.47860  (0.47858)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
ðə tu ɑɹtɪsts ɪkst͡ʃeɪnd͡ʒd ɔtoʊɡɹæfs.
 [!] Character '͡' not found in the vocabulary. Discarding it.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.37734 [0m(+0.00000)
     | > avg_loss: 2.82171 [0m(+0.00000)
     | > avg_log_mle: 0.65565 [0m(+0.00000)
     | > avg_loss_dur: 2.16606 [0m(+0.00000)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_3.pth

[4m[1m > EPOCH: 1/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:29:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01501 [0m(-0.36233)
     | > avg_loss: 2.82171 [0m(+0.00000)
     | > avg_log_mle: 0.65565 [0m(+0.00000)
     | > avg_loss_dur: 2.16606 [0m(+0.00000)


[4m[1m > EPOCH: 2/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:29:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01101 [0m(-0.00400)
     | > avg_loss: 2.82171 [0m(+0.00000)
     | > avg_log_mle: 0.65565 [0m(+0.00000)
     | > avg_loss_dur: 2.16606 [0m(+0.00000)


[4m[1m > EPOCH: 3/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:29:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 2.81372 [0m(-0.00798)
     | > avg_log_mle:[92m 0.65264 [0m(-0.00301)
     | > avg_loss_dur:[92m 2.16108 [0m(-0.00497)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_12.pth

[4m[1m > EPOCH: 4/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:29:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.81358 [0m(-0.00014)
     | > avg_log_mle:[92m 0.65264 [0m(-0.00000)
     | > avg_loss_dur:[92m 2.16095 [0m(-0.00014)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_15.pth

[4m[1m > EPOCH: 5/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:29:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 2.81339 [0m(-0.00019)
     | > avg_log_mle:[92m 0.65263 [0m(-0.00001)
     | > avg_loss_dur:[92m 2.16076 [0m(-0.00018)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_18.pth

[4m[1m > EPOCH: 6/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.81297 [0m(-0.00042)
     | > avg_log_mle:[92m 0.65259 [0m(-0.00003)
     | > avg_loss_dur:[92m 2.16038 [0m(-0.00039)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_21.pth

[4m[1m > EPOCH: 7/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.81229 [0m(-0.00068)
     | > avg_log_mle:[92m 0.65254 [0m(-0.00006)
     | > avg_loss_dur:[92m 2.15975 [0m(-0.00062)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_24.pth

[4m[1m > EPOCH: 8/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 25[0m
     | > loss: 2.29974  (2.29974)
     | > log_mle: 0.58258  (0.58258)
     | > loss_dur: 1.71715  (1.71715)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.25363  (8.25363)
     | > current_lr: 0.00000 
     | > step_time: 1.08940  (1.08937)
     | > loader_time: 0.42340  (0.42338)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 2.81135 [0m(-0.00094)
     | > avg_log_mle:[92m 0.65246 [0m(-0.00008)
     | > avg_loss_dur:[92m 2.15889 [0m(-0.00087)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_27.pth

[4m[1m > EPOCH: 9/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.81013 [0m(-0.00122)
     | > avg_log_mle:[92m 0.65236 [0m(-0.00010)
     | > avg_loss_dur:[92m 2.15777 [0m(-0.00112)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_30.pth

[4m[1m > EPOCH: 10/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 2.80862 [0m(-0.00151)
     | > avg_log_mle:[92m 0.65223 [0m(-0.00013)
     | > avg_loss_dur:[92m 2.15639 [0m(-0.00138)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_33.pth

[4m[1m > EPOCH: 11/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 2.80678 [0m(-0.00184)
     | > avg_log_mle:[92m 0.65208 [0m(-0.00015)
     | > avg_loss_dur:[92m 2.15470 [0m(-0.00169)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_36.pth

[4m[1m > EPOCH: 12/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:30:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.80461 [0m(-0.00217)
     | > avg_log_mle:[92m 0.65190 [0m(-0.00018)
     | > avg_loss_dur:[92m 2.15271 [0m(-0.00199)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_39.pth

[4m[1m > EPOCH: 13/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.80213 [0m(-0.00249)
     | > avg_log_mle:[92m 0.65170 [0m(-0.00021)
     | > avg_loss_dur:[92m 2.15043 [0m(-0.00228)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_42.pth

[4m[1m > EPOCH: 14/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.79929 [0m(-0.00284)
     | > avg_log_mle:[92m 0.65146 [0m(-0.00024)
     | > avg_loss_dur:[92m 2.14783 [0m(-0.00260)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_45.pth

[4m[1m > EPOCH: 15/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.79611 [0m(-0.00318)
     | > avg_log_mle:[92m 0.65119 [0m(-0.00027)
     | > avg_loss_dur:[92m 2.14492 [0m(-0.00291)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_48.pth

[4m[1m > EPOCH: 16/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 50[0m
     | > loss: 2.43811  (2.36504)
     | > log_mle: 0.57656  (0.57892)
     | > loss_dur: 1.86154  (1.78612)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 9.17145  (8.68049)
     | > current_lr: 0.00000 
     | > step_time: 0.40440  (0.72316)
     | > loader_time: 0.10110  (0.26724)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.79259 [0m(-0.00352)
     | > avg_log_mle:[92m 0.65090 [0m(-0.00030)
     | > avg_loss_dur:[92m 2.14170 [0m(-0.00322)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_51.pth

[4m[1m > EPOCH: 17/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.78875 [0m(-0.00384)
     | > avg_log_mle:[92m 0.65057 [0m(-0.00033)
     | > avg_loss_dur:[92m 2.13818 [0m(-0.00351)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_54.pth

[4m[1m > EPOCH: 18/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.78457 [0m(-0.00418)
     | > avg_log_mle:[92m 0.65020 [0m(-0.00036)
     | > avg_loss_dur:[92m 2.13437 [0m(-0.00381)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_57.pth

[4m[1m > EPOCH: 19/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:31:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.78008 [0m(-0.00449)
     | > avg_log_mle:[92m 0.64980 [0m(-0.00040)
     | > avg_loss_dur:[92m 2.13027 [0m(-0.00410)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_60.pth

[4m[1m > EPOCH: 20/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.77525 [0m(-0.00483)
     | > avg_log_mle:[92m 0.64937 [0m(-0.00043)
     | > avg_loss_dur:[92m 2.12588 [0m(-0.00439)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_63.pth

[4m[1m > EPOCH: 21/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.76321 [0m(-0.01204)
     | > avg_log_mle:[92m 0.64890 [0m(-0.00047)
     | > avg_loss_dur:[92m 2.11431 [0m(-0.01157)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_66.pth

[4m[1m > EPOCH: 22/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 2.75775 [0m(-0.00547)
     | > avg_log_mle:[92m 0.64839 [0m(-0.00051)
     | > avg_loss_dur:[92m 2.10936 [0m(-0.00496)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_69.pth

[4m[1m > EPOCH: 23/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 2.75199 [0m(-0.00576)
     | > avg_log_mle:[92m 0.64784 [0m(-0.00055)
     | > avg_loss_dur:[92m 2.10415 [0m(-0.00521)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_72.pth

[4m[1m > EPOCH: 24/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 2.74589 [0m(-0.00610)
     | > avg_log_mle:[92m 0.64725 [0m(-0.00059)
     | > avg_loss_dur:[92m 2.09865 [0m(-0.00550)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_75.pth

[4m[1m > EPOCH: 25/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 75[0m
     | > loss: 2.18137  (2.18137)
     | > log_mle: 0.56456  (0.56456)
     | > loss_dur: 1.61681  (1.61681)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.99229  (7.99229)
     | > current_lr: 0.00001 
     | > step_time: 0.74370  (0.74368)
     | > loader_time: 0.32430  (0.32429)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.73930 [0m(-0.00659)
     | > avg_log_mle:[92m 0.64661 [0m(-0.00064)
     | > avg_loss_dur:[92m 2.09269 [0m(-0.00595)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_78.pth

[4m[1m > EPOCH: 26/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.73222 [0m(-0.00707)
     | > avg_log_mle:[92m 0.64592 [0m(-0.00069)
     | > avg_loss_dur:[92m 2.08630 [0m(-0.00639)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_81.pth

[4m[1m > EPOCH: 27/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:32:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.72498 [0m(-0.00724)
     | > avg_log_mle:[92m 0.64519 [0m(-0.00074)
     | > avg_loss_dur:[92m 2.07980 [0m(-0.00651)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_84.pth

[4m[1m > EPOCH: 28/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.71746 [0m(-0.00752)
     | > avg_log_mle:[92m 0.64440 [0m(-0.00079)
     | > avg_loss_dur:[92m 2.07307 [0m(-0.00673)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_87.pth

[4m[1m > EPOCH: 29/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.66508 [0m(-0.05238)
     | > avg_log_mle:[92m 0.64355 [0m(-0.00085)
     | > avg_loss_dur:[92m 2.02153 [0m(-0.05154)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_90.pth

[4m[1m > EPOCH: 30/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.65600 [0m(-0.00908)
     | > avg_log_mle:[92m 0.64264 [0m(-0.00091)
     | > avg_loss_dur:[92m 2.01336 [0m(-0.00817)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_93.pth

[4m[1m > EPOCH: 31/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.64718 [0m(-0.00882)
     | > avg_log_mle:[92m 0.64167 [0m(-0.00097)
     | > avg_loss_dur:[92m 2.00551 [0m(-0.00785)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_96.pth

[4m[1m > EPOCH: 32/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.63748 [0m(-0.00970)
     | > avg_log_mle:[92m 0.64063 [0m(-0.00104)
     | > avg_loss_dur:[92m 1.99685 [0m(-0.00866)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_99.pth

[4m[1m > EPOCH: 33/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 100[0m
     | > loss: 2.20255  (2.20255)
     | > log_mle: 0.57348  (0.57348)
     | > loss_dur: 1.62907  (1.62907)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.52226  (7.52226)
     | > current_lr: 0.00001 
     | > step_time: 1.16810  (1.16806)
     | > loader_time: 0.44140  (0.44140)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.62710 [0m(-0.01038)
     | > avg_log_mle:[92m 0.63951 [0m(-0.00112)
     | > avg_loss_dur:[92m 1.98759 [0m(-0.00926)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_102.pth

[4m[1m > EPOCH: 34/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:33:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.61584 [0m(-0.01127)
     | > avg_log_mle:[92m 0.63830 [0m(-0.00121)
     | > avg_loss_dur:[92m 1.97753 [0m(-0.01006)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_105.pth

[4m[1m > EPOCH: 35/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.60373 [0m(-0.01211)
     | > avg_log_mle:[92m 0.63700 [0m(-0.00130)
     | > avg_loss_dur:[92m 1.96673 [0m(-0.01081)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_108.pth

[4m[1m > EPOCH: 36/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 2.59097 [0m(-0.01276)
     | > avg_log_mle:[92m 0.63561 [0m(-0.00140)
     | > avg_loss_dur:[92m 1.95536 [0m(-0.01137)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_111.pth

[4m[1m > EPOCH: 37/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01069 [0m(-0.00032)
     | > avg_loss:[92m 2.57732 [0m(-0.01365)
     | > avg_log_mle:[92m 0.63411 [0m(-0.00150)
     | > avg_loss_dur:[92m 1.94321 [0m(-0.01215)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_114.pth

[4m[1m > EPOCH: 38/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00068)
     | > avg_loss:[92m 2.56183 [0m(-0.01548)
     | > avg_log_mle:[92m 0.63249 [0m(-0.00161)
     | > avg_loss_dur:[92m 1.92934 [0m(-0.01387)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_117.pth

[4m[1m > EPOCH: 39/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 2.54494 [0m(-0.01689)
     | > avg_log_mle:[92m 0.63076 [0m(-0.00173)
     | > avg_loss_dur:[92m 1.91418 [0m(-0.01516)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_120.pth

[4m[1m > EPOCH: 40/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.52720 [0m(-0.01774)
     | > avg_log_mle:[92m 0.62890 [0m(-0.00186)
     | > avg_loss_dur:[92m 1.89831 [0m(-0.01588)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_123.pth

[4m[1m > EPOCH: 41/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:34:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 125[0m
     | > loss: 2.25605  (2.18076)
     | > log_mle: 0.55756  (0.56097)
     | > loss_dur: 1.69850  (1.61978)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.44227  (7.10370)
     | > current_lr: 0.00001 
     | > step_time: 0.40340  (0.72616)
     | > loader_time: 0.10410  (0.26474)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.51342 [0m(-0.01379)
     | > avg_log_mle:[92m 0.62689 [0m(-0.00200)
     | > avg_loss_dur:[92m 1.88652 [0m(-0.01178)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_126.pth

[4m[1m > EPOCH: 42/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:35:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00300)
     | > avg_loss:[92m 2.49297 [0m(-0.02044)
     | > avg_log_mle:[92m 0.62473 [0m(-0.00216)
     | > avg_loss_dur:[92m 1.86824 [0m(-0.01828)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_129.pth

[4m[1m > EPOCH: 43/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:35:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01101 [0m(-0.00100)
     | > avg_loss:[92m 2.47182 [0m(-0.02115)
     | > avg_log_mle:[92m 0.62241 [0m(-0.00232)
     | > avg_loss_dur:[92m 1.84941 [0m(-0.01883)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_132.pth

[4m[1m > EPOCH: 44/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:35:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01158 [0m(+0.00057)
     | > avg_loss:[92m 2.45006 [0m(-0.02177)
     | > avg_log_mle:[92m 0.61991 [0m(-0.00250)
     | > avg_loss_dur:[92m 1.83014 [0m(-0.01927)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_135.pth

[4m[1m > EPOCH: 45/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:35:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01067 [0m(-0.00091)
     | > avg_loss:[92m 2.42815 [0m(-0.02190)
     | > avg_log_mle:[92m 0.61723 [0m(-0.00268)
     | > avg_loss_dur:[92m 1.81093 [0m(-0.01922)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_138.pth

[4m[1m > EPOCH: 46/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:35:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00134)
     | > avg_loss:[92m 2.40694 [0m(-0.02121)
     | > avg_log_mle:[92m 0.61434 [0m(-0.00289)
     | > avg_loss_dur:[92m 1.79260 [0m(-0.01833)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_141.pth

[4m[1m > EPOCH: 47/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:35:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00200)
     | > avg_loss:[92m 2.38660 [0m(-0.02034)
     | > avg_log_mle:[92m 0.61124 [0m(-0.00310)
     | > avg_loss_dur:[92m 1.77536 [0m(-0.01724)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_144.pth

[4m[1m > EPOCH: 48/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 2.36742 [0m(-0.01918)
     | > avg_log_mle:[92m 0.60791 [0m(-0.00333)
     | > avg_loss_dur:[92m 1.75951 [0m(-0.01585)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_147.pth

[4m[1m > EPOCH: 49/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 2.34997 [0m(-0.01745)
     | > avg_log_mle:[92m 0.60435 [0m(-0.00356)
     | > avg_loss_dur:[92m 1.74562 [0m(-0.01389)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_150.pth

[4m[1m > EPOCH: 50/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 150[0m
     | > loss: 1.88637  (1.88637)
     | > log_mle: 0.53175  (0.53175)
     | > loss_dur: 1.35462  (1.35462)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.22241  (5.22241)
     | > current_lr: 0.00001 
     | > step_time: 1.16140  (1.16139)
     | > loader_time: 0.37270  (0.37272)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01301 [0m(+0.00200)
     | > avg_loss:[92m 2.33374 [0m(-0.01622)
     | > avg_log_mle:[92m 0.60053 [0m(-0.00382)
     | > avg_loss_dur:[92m 1.73321 [0m(-0.01241)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_153.pth

[4m[1m > EPOCH: 51/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01120 [0m(-0.00182)
     | > avg_loss:[92m 2.33020 [0m(-0.00354)
     | > avg_log_mle:[92m 0.59644 [0m(-0.00409)
     | > avg_loss_dur:[91m 1.73376 [0m(+0.00055)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_156.pth

[4m[1m > EPOCH: 52/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01101 [0m(-0.00018)
     | > avg_loss:[92m 2.31506 [0m(-0.01514)
     | > avg_log_mle:[92m 0.59207 [0m(-0.00437)
     | > avg_loss_dur:[92m 1.72299 [0m(-0.01077)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_159.pth

[4m[1m > EPOCH: 53/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01101 [0m(-0.00000)
     | > avg_loss:[92m 2.29962 [0m(-0.01543)
     | > avg_log_mle:[92m 0.58743 [0m(-0.00464)
     | > avg_loss_dur:[92m 1.71219 [0m(-0.01079)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_162.pth

[4m[1m > EPOCH: 54/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:36:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00972 [0m(-0.00129)
     | > avg_loss:[92m 2.28365 [0m(-0.01598)
     | > avg_log_mle:[92m 0.58252 [0m(-0.00491)
     | > avg_loss_dur:[92m 1.70113 [0m(-0.01106)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_165.pth

[4m[1m > EPOCH: 55/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:37:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01269 [0m(+0.00297)
     | > avg_loss:[92m 2.25884 [0m(-0.02480)
     | > avg_log_mle:[92m 0.57731 [0m(-0.00521)
     | > avg_loss_dur:[92m 1.68154 [0m(-0.01959)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_168.pth

[4m[1m > EPOCH: 56/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:37:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01087 [0m(-0.00182)
     | > avg_loss:[92m 2.24126 [0m(-0.01758)
     | > avg_log_mle:[92m 0.57180 [0m(-0.00551)
     | > avg_loss_dur:[92m 1.66947 [0m(-0.01207)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_171.pth

[4m[1m > EPOCH: 57/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:37:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01512 [0m(+0.00425)
     | > avg_loss:[92m 2.22220 [0m(-0.01906)
     | > avg_log_mle:[92m 0.56600 [0m(-0.00580)
     | > avg_loss_dur:[92m 1.65620 [0m(-0.01326)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_174.pth

[4m[1m > EPOCH: 58/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:37:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 175[0m
     | > loss: 1.92024  (1.92024)
     | > log_mle: 0.51416  (0.51416)
     | > loss_dur: 1.40608  (1.40608)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.83043  (4.83043)
     | > current_lr: 0.00001 
     | > step_time: 1.39490  (1.39490)
     | > loader_time: 0.47110  (0.47110)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00941 [0m(-0.00571)
     | > avg_loss:[91m 2.24204 [0m(+0.01983)
     | > avg_log_mle:[92m 0.55994 [0m(-0.00606)
     | > avg_loss_dur:[91m 1.68210 [0m(+0.02590)


[4m[1m > EPOCH: 59/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:37:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00040)
     | > avg_loss:[92m 2.21996 [0m(-0.02207)
     | > avg_log_mle:[92m 0.55362 [0m(-0.00632)
     | > avg_loss_dur:[92m 1.66635 [0m(-0.01575)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_180.pth

[4m[1m > EPOCH: 60/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:37:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.19738 [0m(-0.02259)
     | > avg_log_mle:[92m 0.54705 [0m(-0.00656)
     | > avg_loss_dur:[92m 1.65032 [0m(-0.01602)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_183.pth

[4m[1m > EPOCH: 61/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 2.47295 [0m(+0.27558)
     | > avg_log_mle:[92m 0.54023 [0m(-0.00682)
     | > avg_loss_dur:[91m 1.93272 [0m(+0.28240)


[4m[1m > EPOCH: 62/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.44640 [0m(-0.02655)
     | > avg_log_mle:[92m 0.53304 [0m(-0.00719)
     | > avg_loss_dur:[92m 1.91336 [0m(-0.01936)


[4m[1m > EPOCH: 63/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.41927 [0m(-0.02713)
     | > avg_log_mle:[92m 0.52558 [0m(-0.00746)
     | > avg_loss_dur:[92m 1.89370 [0m(-0.01967)


[4m[1m > EPOCH: 64/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.39081 [0m(-0.02846)
     | > avg_log_mle:[92m 0.51790 [0m(-0.00767)
     | > avg_loss_dur:[92m 1.87291 [0m(-0.02079)


[4m[1m > EPOCH: 65/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.20797 [0m(-0.18284)
     | > avg_log_mle:[92m 0.50997 [0m(-0.00793)
     | > avg_loss_dur:[92m 1.69800 [0m(-0.17491)


[4m[1m > EPOCH: 66/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 200[0m
     | > loss: 1.79150  (1.76763)
     | > log_mle: 0.45526  (0.46449)
     | > loss_dur: 1.33624  (1.30314)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.72255  (4.54348)
     | > current_lr: 0.00002 
     | > step_time: 0.39640  (0.73166)
     | > loader_time: 0.10910  (0.27375)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.15764 [0m(-0.05033)
     | > avg_log_mle:[92m 0.50177 [0m(-0.00820)
     | > avg_loss_dur:[92m 1.65587 [0m(-0.04213)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_201.pth

[4m[1m > EPOCH: 67/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 2.12636 [0m(-0.03128)
     | > avg_log_mle:[92m 0.49343 [0m(-0.00834)
     | > avg_loss_dur:[92m 1.63293 [0m(-0.02294)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_204.pth

[4m[1m > EPOCH: 68/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.09624 [0m(-0.03012)
     | > avg_log_mle:[92m 0.48503 [0m(-0.00839)
     | > avg_loss_dur:[92m 1.61121 [0m(-0.02172)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_207.pth

[4m[1m > EPOCH: 69/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:38:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 2.06085 [0m(-0.03540)
     | > avg_log_mle:[92m 0.47662 [0m(-0.00842)
     | > avg_loss_dur:[92m 1.58423 [0m(-0.02698)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_210.pth

[4m[1m > EPOCH: 70/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[92m 2.02993 [0m(-0.03091)
     | > avg_log_mle:[92m 0.46818 [0m(-0.00843)
     | > avg_loss_dur:[92m 1.56175 [0m(-0.02248)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_213.pth

[4m[1m > EPOCH: 71/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 1.99956 [0m(-0.03038)
     | > avg_log_mle:[92m 0.45975 [0m(-0.00843)
     | > avg_loss_dur:[92m 1.53980 [0m(-0.02195)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_216.pth

[4m[1m > EPOCH: 72/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 1.96972 [0m(-0.02984)
     | > avg_log_mle:[92m 0.45136 [0m(-0.00839)
     | > avg_loss_dur:[92m 1.51836 [0m(-0.02144)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_219.pth

[4m[1m > EPOCH: 73/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00300)
     | > avg_loss:[92m 1.93953 [0m(-0.03019)
     | > avg_log_mle:[92m 0.44305 [0m(-0.00831)
     | > avg_loss_dur:[92m 1.49648 [0m(-0.02188)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_222.pth

[4m[1m > EPOCH: 74/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00300)
     | > avg_loss:[92m 1.90798 [0m(-0.03155)
     | > avg_log_mle:[92m 0.43483 [0m(-0.00821)
     | > avg_loss_dur:[92m 1.47315 [0m(-0.02333)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_225.pth

[4m[1m > EPOCH: 75/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 225[0m
     | > loss: 1.41578  (1.41578)
     | > log_mle: 0.40977  (0.40977)
     | > loss_dur: 1.00600  (1.00600)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.67890  (3.67890)
     | > current_lr: 0.00002 
     | > step_time: 0.77030  (0.77025)
     | > loader_time: 0.36960  (0.36960)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.87585 [0m(-0.03213)
     | > avg_log_mle:[92m 0.42674 [0m(-0.00810)
     | > avg_loss_dur:[92m 1.44912 [0m(-0.02403)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_228.pth

[4m[1m > EPOCH: 76/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:39:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 1.91595 [0m(+0.04010)
     | > avg_log_mle:[92m 0.41872 [0m(-0.00802)
     | > avg_loss_dur:[91m 1.49724 [0m(+0.04812)


[4m[1m > EPOCH: 77/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.88583 [0m(-0.03013)
     | > avg_log_mle:[92m 0.41079 [0m(-0.00793)
     | > avg_loss_dur:[92m 1.47504 [0m(-0.02220)


[4m[1m > EPOCH: 78/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 1.85571 [0m(-0.03011)
     | > avg_log_mle:[92m 0.40297 [0m(-0.00782)
     | > avg_loss_dur:[92m 1.45274 [0m(-0.02230)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_237.pth

[4m[1m > EPOCH: 79/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 1.82656 [0m(-0.02915)
     | > avg_log_mle:[92m 0.39528 [0m(-0.00769)
     | > avg_loss_dur:[92m 1.43129 [0m(-0.02145)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_240.pth

[4m[1m > EPOCH: 80/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 2.39107 [0m(+0.56450)
     | > avg_log_mle:[92m 0.38771 [0m(-0.00757)
     | > avg_loss_dur:[91m 2.00336 [0m(+0.57207)


[4m[1m > EPOCH: 81/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 2.35621 [0m(-0.03485)
     | > avg_log_mle:[92m 0.38016 [0m(-0.00755)
     | > avg_loss_dur:[92m 1.97606 [0m(-0.02730)


[4m[1m > EPOCH: 82/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.34728 [0m(-0.00893)
     | > avg_log_mle:[92m 0.37277 [0m(-0.00738)
     | > avg_loss_dur:[92m 1.97451 [0m(-0.00155)


[4m[1m > EPOCH: 83/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 250[0m
     | > loss: 1.31352  (1.31352)
     | > log_mle: 0.37540  (0.37540)
     | > loss_dur: 0.93811  (0.93811)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.22537  (3.22537)
     | > current_lr: 0.00002 
     | > step_time: 1.10600  (1.10601)
     | > loader_time: 0.42440  (0.42439)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.31283 [0m(-0.03445)
     | > avg_log_mle:[92m 0.36561 [0m(-0.00717)
     | > avg_loss_dur:[92m 1.94722 [0m(-0.02729)


[4m[1m > EPOCH: 84/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:40:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.27792 [0m(-0.03491)
     | > avg_log_mle:[92m 0.35860 [0m(-0.00700)
     | > avg_loss_dur:[92m 1.91931 [0m(-0.02791)


[4m[1m > EPOCH: 85/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.24476 [0m(-0.03316)
     | > avg_log_mle:[92m 0.35160 [0m(-0.00700)
     | > avg_loss_dur:[92m 1.89316 [0m(-0.02615)


[4m[1m > EPOCH: 86/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.21714 [0m(-0.02762)
     | > avg_log_mle:[92m 0.34469 [0m(-0.00691)
     | > avg_loss_dur:[92m 1.87245 [0m(-0.02071)


[4m[1m > EPOCH: 87/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.18377 [0m(-0.03337)
     | > avg_log_mle:[92m 0.33793 [0m(-0.00676)
     | > avg_loss_dur:[92m 1.84584 [0m(-0.02661)


[4m[1m > EPOCH: 88/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 2.14492 [0m(-0.03885)
     | > avg_log_mle:[92m 0.33125 [0m(-0.00668)
     | > avg_loss_dur:[92m 1.81367 [0m(-0.03217)


[4m[1m > EPOCH: 89/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 2.11671 [0m(-0.02821)
     | > avg_log_mle:[92m 0.32443 [0m(-0.00683)
     | > avg_loss_dur:[92m 1.79228 [0m(-0.02138)


[4m[1m > EPOCH: 90/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 2.08943 [0m(-0.02728)
     | > avg_log_mle:[92m 0.31756 [0m(-0.00687)
     | > avg_loss_dur:[92m 1.77187 [0m(-0.02041)


[4m[1m > EPOCH: 91/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 275[0m
     | > loss: 1.18560  (1.16731)
     | > log_mle: 0.29909  (0.31531)
     | > loss_dur: 0.88651  (0.85200)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.85827  (2.82007)
     | > current_lr: 0.00002 
     | > step_time: 0.42860  (0.84950)
     | > loader_time: 0.11260  (0.28702)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 2.06303 [0m(-0.02640)
     | > avg_log_mle:[92m 0.31083 [0m(-0.00673)
     | > avg_loss_dur:[92m 1.75220 [0m(-0.01967)


[4m[1m > EPOCH: 92/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 2.03690 [0m(-0.02612)
     | > avg_log_mle:[92m 0.30418 [0m(-0.00665)
     | > avg_loss_dur:[92m 1.73273 [0m(-0.01947)


[4m[1m > EPOCH: 93/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:41:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 2.01102 [0m(-0.02588)
     | > avg_log_mle:[92m 0.29736 [0m(-0.00681)
     | > avg_loss_dur:[92m 1.71366 [0m(-0.01907)


[4m[1m > EPOCH: 94/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 1.98585 [0m(-0.02518)
     | > avg_log_mle:[92m 0.29065 [0m(-0.00671)
     | > avg_loss_dur:[92m 1.69519 [0m(-0.01846)


[4m[1m > EPOCH: 95/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 1.92874 [0m(-0.05711)
     | > avg_log_mle:[92m 0.28406 [0m(-0.00659)
     | > avg_loss_dur:[92m 1.64468 [0m(-0.05052)


[4m[1m > EPOCH: 96/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 1.91883 [0m(-0.00991)
     | > avg_log_mle:[92m 0.27752 [0m(-0.00654)
     | > avg_loss_dur:[92m 1.64130 [0m(-0.00337)


[4m[1m > EPOCH: 97/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 1.89541 [0m(-0.02342)
     | > avg_log_mle:[92m 0.27101 [0m(-0.00651)
     | > avg_loss_dur:[92m 1.62440 [0m(-0.01690)


[4m[1m > EPOCH: 98/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00300)
     | > avg_loss:[92m 1.86891 [0m(-0.02649)
     | > avg_log_mle:[92m 0.26458 [0m(-0.00643)
     | > avg_loss_dur:[92m 1.60433 [0m(-0.02006)


[4m[1m > EPOCH: 99/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00200)
     | > avg_loss:[92m 1.84550 [0m(-0.02342)
     | > avg_log_mle:[92m 0.25808 [0m(-0.00650)
     | > avg_loss_dur:[92m 1.58742 [0m(-0.01691)


[4m[1m > EPOCH: 100/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 300[0m
     | > loss: 0.92039  (0.92039)
     | > log_mle: 0.26557  (0.26557)
     | > loss_dur: 0.65482  (0.65482)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.33307  (2.33307)
     | > current_lr: 0.00002 
     | > step_time: 0.73170  (0.73166)
     | > loader_time: 0.33230  (0.33230)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 1.82004 [0m(-0.02546)
     | > avg_log_mle:[92m 0.25151 [0m(-0.00657)
     | > avg_loss_dur:[92m 1.56853 [0m(-0.01889)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_303.pth

[4m[1m > EPOCH: 101/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:42:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 1.85509 [0m(+0.03505)
     | > avg_log_mle:[92m 0.24504 [0m(-0.00647)
     | > avg_loss_dur:[91m 1.61006 [0m(+0.04152)


[4m[1m > EPOCH: 102/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 1.83551 [0m(-0.01959)
     | > avg_log_mle:[92m 0.23845 [0m(-0.00659)
     | > avg_loss_dur:[92m 1.59706 [0m(-0.01300)


[4m[1m > EPOCH: 103/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 1.81395 [0m(-0.02156)
     | > avg_log_mle:[92m 0.23192 [0m(-0.00653)
     | > avg_loss_dur:[92m 1.58203 [0m(-0.01503)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_312.pth

[4m[1m > EPOCH: 104/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.80304 [0m(-0.01091)
     | > avg_log_mle:[92m 0.22537 [0m(-0.00654)
     | > avg_loss_dur:[92m 1.57767 [0m(-0.00436)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_315.pth

[4m[1m > EPOCH: 105/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 1.78209 [0m(-0.02095)
     | > avg_log_mle:[92m 0.21872 [0m(-0.00665)
     | > avg_loss_dur:[92m 1.56337 [0m(-0.01430)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_318.pth

[4m[1m > EPOCH: 106/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 1.24125 [0m(-0.54084)
     | > avg_log_mle:[92m 0.21224 [0m(-0.00648)
     | > avg_loss_dur:[92m 1.02901 [0m(-0.53436)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_321.pth

[4m[1m > EPOCH: 107/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 1.22749 [0m(-0.01376)
     | > avg_log_mle:[92m 0.20579 [0m(-0.00645)
     | > avg_loss_dur:[92m 1.02170 [0m(-0.00731)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_324.pth

[4m[1m > EPOCH: 108/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 325[0m
     | > loss: 0.88739  (0.88739)
     | > log_mle: 0.23550  (0.23550)
     | > loss_dur: 0.65189  (0.65189)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.12869  (2.12869)
     | > current_lr: 0.00003 
     | > step_time: 1.03390  (1.03394)
     | > loader_time: 0.43040  (0.43039)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 1.21366 [0m(-0.01383)
     | > avg_log_mle:[92m 0.19948 [0m(-0.00631)
     | > avg_loss_dur:[92m 1.01418 [0m(-0.00752)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_327.pth

[4m[1m > EPOCH: 109/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:43:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 1.20021 [0m(-0.01345)
     | > avg_log_mle:[92m 0.19318 [0m(-0.00629)
     | > avg_loss_dur:[92m 1.00703 [0m(-0.00715)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_330.pth

[4m[1m > EPOCH: 110/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 1.18168 [0m(-0.01853)
     | > avg_log_mle:[92m 0.18708 [0m(-0.00610)
     | > avg_loss_dur:[92m 0.99460 [0m(-0.01243)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_333.pth

[4m[1m > EPOCH: 111/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 1.16479 [0m(-0.01689)
     | > avg_log_mle:[92m 0.18098 [0m(-0.00611)
     | > avg_loss_dur:[92m 0.98381 [0m(-0.01078)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_336.pth

[4m[1m > EPOCH: 112/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.15156 [0m(-0.01324)
     | > avg_log_mle:[92m 0.17488 [0m(-0.00610)
     | > avg_loss_dur:[92m 0.97667 [0m(-0.00714)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_339.pth

[4m[1m > EPOCH: 113/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 1.25546 [0m(+0.10390)
     | > avg_log_mle:[92m 0.16886 [0m(-0.00602)
     | > avg_loss_dur:[91m 1.08660 [0m(+0.10992)


[4m[1m > EPOCH: 114/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 1.24434 [0m(-0.01111)
     | > avg_log_mle:[92m 0.16315 [0m(-0.00571)
     | > avg_loss_dur:[92m 1.08120 [0m(-0.00540)


[4m[1m > EPOCH: 115/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 1.23255 [0m(-0.01180)
     | > avg_log_mle:[92m 0.15732 [0m(-0.00583)
     | > avg_loss_dur:[92m 1.07523 [0m(-0.00597)


[4m[1m > EPOCH: 116/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:44:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 350[0m
     | > loss: 0.82620  (0.81030)
     | > log_mle: 0.15001  (0.17352)
     | > loss_dur: 0.67619  (0.63678)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.11574  (2.02482)
     | > current_lr: 0.00003 
     | > step_time: 0.40540  (0.74418)
     | > loader_time: 0.10210  (0.27375)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[92m 1.21809 [0m(-0.01446)
     | > avg_log_mle:[92m 0.15173 [0m(-0.00559)
     | > avg_loss_dur:[92m 1.06636 [0m(-0.00887)


[4m[1m > EPOCH: 117/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 1.20412 [0m(-0.01396)
     | > avg_log_mle:[92m 0.14601 [0m(-0.00572)
     | > avg_loss_dur:[92m 1.05811 [0m(-0.00824)


[4m[1m > EPOCH: 118/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[92m 1.19508 [0m(-0.00904)
     | > avg_log_mle:[92m 0.14047 [0m(-0.00554)
     | > avg_loss_dur:[92m 1.05461 [0m(-0.00350)


[4m[1m > EPOCH: 119/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 1.19406 [0m(-0.00102)
     | > avg_log_mle:[92m 0.13488 [0m(-0.00559)
     | > avg_loss_dur:[91m 1.05917 [0m(+0.00456)


[4m[1m > EPOCH: 120/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.18063 [0m(-0.01342)
     | > avg_log_mle:[92m 0.12948 [0m(-0.00540)
     | > avg_loss_dur:[92m 1.05115 [0m(-0.00802)


[4m[1m > EPOCH: 121/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 1.16748 [0m(-0.01315)
     | > avg_log_mle:[92m 0.12414 [0m(-0.00534)
     | > avg_loss_dur:[92m 1.04334 [0m(-0.00781)


[4m[1m > EPOCH: 122/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 1.15268 [0m(-0.01480)
     | > avg_log_mle:[92m 0.11890 [0m(-0.00525)
     | > avg_loss_dur:[92m 1.03379 [0m(-0.00955)


[4m[1m > EPOCH: 123/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 1.13885 [0m(-0.01383)
     | > avg_log_mle:[92m 0.11397 [0m(-0.00493)
     | > avg_loss_dur:[92m 1.02488 [0m(-0.00891)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_372.pth

[4m[1m > EPOCH: 124/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:45:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.13413 [0m(-0.00472)
     | > avg_log_mle:[92m 0.10952 [0m(-0.00445)
     | > avg_loss_dur:[92m 1.02461 [0m(-0.00027)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_375.pth

[4m[1m > EPOCH: 125/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 375[0m
     | > loss: 0.63250  (0.63250)
     | > log_mle: 0.14282  (0.14282)
     | > loss_dur: 0.48968  (0.48968)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.77318  (1.77318)
     | > current_lr: 0.00003 
     | > step_time: 0.72770  (0.72766)
     | > loader_time: 0.33930  (0.33931)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 1.11097 [0m(-0.02316)
     | > avg_log_mle:[92m 0.10558 [0m(-0.00394)
     | > avg_loss_dur:[92m 1.00539 [0m(-0.01922)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_378.pth

[4m[1m > EPOCH: 126/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 1.09747 [0m(-0.01350)
     | > avg_log_mle:[92m 0.10025 [0m(-0.00533)
     | > avg_loss_dur:[92m 0.99722 [0m(-0.00816)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_381.pth

[4m[1m > EPOCH: 127/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 1.09492 [0m(-0.00255)
     | > avg_log_mle:[92m 0.09449 [0m(-0.00576)
     | > avg_loss_dur:[91m 1.00043 [0m(+0.00321)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_384.pth

[4m[1m > EPOCH: 128/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[92m 1.07773 [0m(-0.01719)
     | > avg_log_mle:[92m 0.08990 [0m(-0.00459)
     | > avg_loss_dur:[92m 0.98783 [0m(-0.01260)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_387.pth

[4m[1m > EPOCH: 129/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[92m 1.06558 [0m(-0.01216)
     | > avg_log_mle:[92m 0.08507 [0m(-0.00483)
     | > avg_loss_dur:[92m 0.98051 [0m(-0.00732)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_390.pth

[4m[1m > EPOCH: 130/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 1.06762 [0m(+0.00204)
     | > avg_log_mle:[92m 0.08125 [0m(-0.00382)
     | > avg_loss_dur:[91m 0.98637 [0m(+0.00586)


[4m[1m > EPOCH: 131/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:46:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 1.04442 [0m(-0.02320)
     | > avg_log_mle:[92m 0.07678 [0m(-0.00447)
     | > avg_loss_dur:[92m 0.96764 [0m(-0.01873)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_396.pth

[4m[1m > EPOCH: 132/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:47:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.03608 [0m(-0.00833)
     | > avg_log_mle:[92m 0.07186 [0m(-0.00491)
     | > avg_loss_dur:[92m 0.96422 [0m(-0.00342)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_399.pth

[4m[1m > EPOCH: 133/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:47:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 400[0m
     | > loss: 0.63558  (0.63558)
     | > log_mle: 0.12735  (0.12735)
     | > loss_dur: 0.50824  (0.50824)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.63074  (1.63074)
     | > current_lr: 0.00003 
     | > step_time: 1.03890  (1.03894)
     | > loader_time: 0.42340  (0.42339)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.02371 [0m(-0.01237)
     | > avg_log_mle:[92m 0.06726 [0m(-0.00460)
     | > avg_loss_dur:[92m 0.95645 [0m(-0.00777)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_402.pth

[4m[1m > EPOCH: 134/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:47:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 1.01182 [0m(-0.01190)
     | > avg_log_mle:[92m 0.06284 [0m(-0.00442)
     | > avg_loss_dur:[92m 0.94898 [0m(-0.00747)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_405.pth

[4m[1m > EPOCH: 135/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:47:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 1.00068 [0m(-0.01113)
     | > avg_log_mle:[92m 0.05848 [0m(-0.00435)
     | > avg_loss_dur:[92m 0.94220 [0m(-0.00678)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_408.pth

[4m[1m > EPOCH: 136/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:47:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.99404 [0m(-0.00665)
     | > avg_log_mle:[92m 0.05424 [0m(-0.00424)
     | > avg_loss_dur:[92m 0.93980 [0m(-0.00240)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_411.pth

[4m[1m > EPOCH: 137/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:47:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.98382 [0m(-0.01021)
     | > avg_log_mle:[92m 0.05025 [0m(-0.00399)
     | > avg_loss_dur:[92m 0.93358 [0m(-0.00622)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_414.pth

[4m[1m > EPOCH: 138/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.96286 [0m(-0.02096)
     | > avg_log_mle:[92m 0.04652 [0m(-0.00373)
     | > avg_loss_dur:[92m 0.91635 [0m(-0.01723)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_417.pth

[4m[1m > EPOCH: 139/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00200)
     | > avg_loss:[92m 0.95706 [0m(-0.00580)
     | > avg_log_mle:[92m 0.04400 [0m(-0.00252)
     | > avg_loss_dur:[92m 0.91307 [0m(-0.00328)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_420.pth

[4m[1m > EPOCH: 140/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00300)
     | > avg_loss:[92m 0.95143 [0m(-0.00564)
     | > avg_log_mle:[92m 0.03934 [0m(-0.00465)
     | > avg_loss_dur:[92m 0.91208 [0m(-0.00098)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_423.pth

[4m[1m > EPOCH: 141/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 425[0m
     | > loss: 0.58697  (0.58194)
     | > log_mle: 0.04147  (0.06950)
     | > loss_dur: 0.54550  (0.51244)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.30854  (2.07072)
     | > current_lr: 0.00004 
     | > step_time: 0.39840  (0.71815)
     | > loader_time: 0.10710  (0.26774)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.92446 [0m(-0.02697)
     | > avg_log_mle:[92m 0.03283 [0m(-0.00652)
     | > avg_loss_dur:[92m 0.89163 [0m(-0.02045)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_426.pth

[4m[1m > EPOCH: 142/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 1.02905 [0m(+0.10459)
     | > avg_log_mle:[92m 0.02933 [0m(-0.00350)
     | > avg_loss_dur:[91m 0.99972 [0m(+0.10809)


[4m[1m > EPOCH: 143/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 1.02463 [0m(-0.00442)
     | > avg_log_mle:[92m 0.02544 [0m(-0.00388)
     | > avg_loss_dur:[92m 0.99919 [0m(-0.00053)


[4m[1m > EPOCH: 144/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:48:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.90937 [0m(-0.11526)
     | > avg_log_mle:[92m 0.02241 [0m(-0.00303)
     | > avg_loss_dur:[92m 0.88696 [0m(-0.11223)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_435.pth

[4m[1m > EPOCH: 145/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.89294 [0m(-0.01643)
     | > avg_log_mle:[92m 0.01752 [0m(-0.00489)
     | > avg_loss_dur:[92m 0.87542 [0m(-0.01154)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_438.pth

[4m[1m > EPOCH: 146/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.98961 [0m(+0.09667)
     | > avg_log_mle:[92m 0.01321 [0m(-0.00431)
     | > avg_loss_dur:[91m 0.97640 [0m(+0.10098)


[4m[1m > EPOCH: 147/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.87456 [0m(-0.11505)
     | > avg_log_mle:[92m 0.01002 [0m(-0.00319)
     | > avg_loss_dur:[92m 0.86454 [0m(-0.11186)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_444.pth

[4m[1m > EPOCH: 148/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.86596 [0m(-0.00860)
     | > avg_log_mle:[92m 0.00662 [0m(-0.00340)
     | > avg_loss_dur:[92m 0.85934 [0m(-0.00520)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_447.pth

[4m[1m > EPOCH: 149/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.96855 [0m(+0.10259)
     | > avg_log_mle:[92m 0.00286 [0m(-0.00376)
     | > avg_loss_dur:[91m 0.96570 [0m(+0.10635)


[4m[1m > EPOCH: 150/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 450[0m
     | > loss: 0.44081  (0.44081)
     | > log_mle: 0.04712  (0.04712)
     | > loss_dur: 0.39369  (0.39369)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.31674  (1.31674)
     | > current_lr: 0.00004 
     | > step_time: 0.83180  (0.83176)
     | > loader_time: 0.32930  (0.32930)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.95911 [0m(-0.00944)
     | > avg_log_mle:[92m -0.00159 [0m(-0.00445)
     | > avg_loss_dur:[92m 0.96071 [0m(-0.00499)


[4m[1m > EPOCH: 151/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:49:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 1.02040 [0m(+0.06129)
     | > avg_log_mle:[92m -0.00590 [0m(-0.00431)
     | > avg_loss_dur:[91m 1.02630 [0m(+0.06560)


[4m[1m > EPOCH: 152/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 1.01377 [0m(-0.00664)
     | > avg_log_mle:[92m -0.00887 [0m(-0.00297)
     | > avg_loss_dur:[92m 1.02263 [0m(-0.00367)


[4m[1m > EPOCH: 153/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 1.00485 [0m(-0.00891)
     | > avg_log_mle:[92m -0.01279 [0m(-0.00392)
     | > avg_loss_dur:[92m 1.01764 [0m(-0.00499)


[4m[1m > EPOCH: 154/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 1.03317 [0m(+0.02832)
     | > avg_log_mle:[92m -0.01648 [0m(-0.00370)
     | > avg_loss_dur:[91m 1.04966 [0m(+0.03202)


[4m[1m > EPOCH: 155/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 1.03945 [0m(+0.00628)
     | > avg_log_mle:[92m -0.02003 [0m(-0.00354)
     | > avg_loss_dur:[91m 1.05948 [0m(+0.00982)


[4m[1m > EPOCH: 156/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 1.03350 [0m(-0.00595)
     | > avg_log_mle:[92m -0.02211 [0m(-0.00208)
     | > avg_loss_dur:[92m 1.05561 [0m(-0.00387)


[4m[1m > EPOCH: 157/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 1.02637 [0m(-0.00713)
     | > avg_log_mle:[92m -0.02467 [0m(-0.00256)
     | > avg_loss_dur:[92m 1.05104 [0m(-0.00457)


[4m[1m > EPOCH: 158/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:50:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 475[0m
     | > loss: 0.46472  (0.46472)
     | > log_mle: 0.03680  (0.03680)
     | > loss_dur: 0.42792  (0.42792)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.45978  (1.45978)
     | > current_lr: 0.00004 
     | > step_time: 1.03790  (1.03794)
     | > loader_time: 0.42840  (0.42839)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 1.01847 [0m(-0.00791)
     | > avg_log_mle:[92m -0.03147 [0m(-0.00680)
     | > avg_loss_dur:[92m 1.04993 [0m(-0.00111)


[4m[1m > EPOCH: 159/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 1.00935 [0m(-0.00912)
     | > avg_log_mle:[92m -0.03606 [0m(-0.00460)
     | > avg_loss_dur:[92m 1.04541 [0m(-0.00452)


[4m[1m > EPOCH: 160/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.98291 [0m(-0.02644)
     | > avg_log_mle:[92m -0.04022 [0m(-0.00416)
     | > avg_loss_dur:[92m 1.02314 [0m(-0.02228)


[4m[1m > EPOCH: 161/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.97548 [0m(-0.00743)
     | > avg_log_mle:[92m -0.04360 [0m(-0.00338)
     | > avg_loss_dur:[92m 1.01908 [0m(-0.00405)


[4m[1m > EPOCH: 162/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.96904 [0m(-0.00645)
     | > avg_log_mle:[92m -0.04645 [0m(-0.00285)
     | > avg_loss_dur:[92m 1.01549 [0m(-0.00360)


[4m[1m > EPOCH: 163/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.95997 [0m(-0.00907)
     | > avg_log_mle:[91m -0.04562 [0m(+0.00084)
     | > avg_loss_dur:[92m 1.00558 [0m(-0.00990)


[4m[1m > EPOCH: 164/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.94912 [0m(-0.01084)
     | > avg_log_mle:[91m -0.03896 [0m(+0.00665)
     | > avg_loss_dur:[92m 0.98808 [0m(-0.01750)


[4m[1m > EPOCH: 165/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:51:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.95036 [0m(+0.00124)
     | > avg_log_mle:[92m -0.05148 [0m(-0.01251)
     | > avg_loss_dur:[91m 1.00184 [0m(+0.01375)


[4m[1m > EPOCH: 166/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 500[0m
     | > loss: 0.42036  (0.42071)
     | > log_mle: -0.05366  (-0.02089)
     | > loss_dur: 0.47401  (0.44160)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.81297  (1.99152)
     | > current_lr: 0.00004 
     | > step_time: 0.39440  (0.71615)
     | > loader_time: 0.10010  (0.27375)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.82387 [0m(-0.12650)
     | > avg_log_mle:[92m -0.05874 [0m(-0.00727)
     | > avg_loss_dur:[92m 0.88261 [0m(-0.11923)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_501.pth

[4m[1m > EPOCH: 167/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[91m 0.88699 [0m(+0.06312)
     | > avg_log_mle:[92m -0.05991 [0m(-0.00116)
     | > avg_loss_dur:[91m 0.94689 [0m(+0.06428)


[4m[1m > EPOCH: 168/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00100)
     | > avg_loss:[91m 0.93001 [0m(+0.04302)
     | > avg_log_mle:[92m -0.06288 [0m(-0.00297)
     | > avg_loss_dur:[91m 0.99288 [0m(+0.04599)


[4m[1m > EPOCH: 169/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01802 [0m(+0.00601)
     | > avg_loss:[92m 0.72647 [0m(-0.20354)
     | > avg_log_mle:[92m -0.07030 [0m(-0.00742)
     | > avg_loss_dur:[92m 0.79677 [0m(-0.19612)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_510.pth

[4m[1m > EPOCH: 170/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00801)
     | > avg_loss:[91m 0.82542 [0m(+0.09895)
     | > avg_log_mle:[92m -0.07069 [0m(-0.00039)
     | > avg_loss_dur:[91m 0.89611 [0m(+0.09934)


[4m[1m > EPOCH: 171/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.88686 [0m(+0.06144)
     | > avg_log_mle:[92m -0.07085 [0m(-0.00016)
     | > avg_loss_dur:[91m 0.95771 [0m(+0.06160)


[4m[1m > EPOCH: 172/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:52:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.81475 [0m(-0.07211)
     | > avg_log_mle:[92m -0.07824 [0m(-0.00739)
     | > avg_loss_dur:[92m 0.89299 [0m(-0.06472)


[4m[1m > EPOCH: 173/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.81191 [0m(-0.00284)
     | > avg_log_mle:[92m -0.07971 [0m(-0.00147)
     | > avg_loss_dur:[92m 0.89162 [0m(-0.00137)


[4m[1m > EPOCH: 174/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[91m 0.86266 [0m(+0.05075)
     | > avg_log_mle:[92m -0.08012 [0m(-0.00041)
     | > avg_loss_dur:[91m 0.94278 [0m(+0.05116)


[4m[1m > EPOCH: 175/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 525[0m
     | > loss: 0.30249  (0.30249)
     | > log_mle: -0.03648  (-0.03648)
     | > loss_dur: 0.33897  (0.33897)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.70249  (1.70249)
     | > current_lr: 0.00004 
     | > step_time: 0.73470  (0.73467)
     | > loader_time: 0.34830  (0.34832)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[92m 0.79928 [0m(-0.06338)
     | > avg_log_mle:[92m -0.08802 [0m(-0.00790)
     | > avg_loss_dur:[92m 0.88730 [0m(-0.05548)


[4m[1m > EPOCH: 176/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.78464 [0m(-0.01464)
     | > avg_log_mle:[92m -0.09234 [0m(-0.00431)
     | > avg_loss_dur:[92m 0.87697 [0m(-0.01033)


[4m[1m > EPOCH: 177/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.79492 [0m(+0.01028)
     | > avg_log_mle:[91m -0.09173 [0m(+0.00061)
     | > avg_loss_dur:[91m 0.88665 [0m(+0.00967)


[4m[1m > EPOCH: 178/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.78443 [0m(-0.01049)
     | > avg_log_mle:[92m -0.09560 [0m(-0.00387)
     | > avg_loss_dur:[92m 0.88002 [0m(-0.00662)


[4m[1m > EPOCH: 179/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:53:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.77649 [0m(-0.00794)
     | > avg_log_mle:[92m -0.10138 [0m(-0.00579)
     | > avg_loss_dur:[92m 0.87787 [0m(-0.00216)


[4m[1m > EPOCH: 180/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.76800 [0m(-0.00848)
     | > avg_log_mle:[92m -0.10362 [0m(-0.00223)
     | > avg_loss_dur:[92m 0.87162 [0m(-0.00625)


[4m[1m > EPOCH: 181/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.82465 [0m(+0.05665)
     | > avg_log_mle:[92m -0.10392 [0m(-0.00030)
     | > avg_loss_dur:[91m 0.92857 [0m(+0.05696)


[4m[1m > EPOCH: 182/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.82572 [0m(+0.00106)
     | > avg_log_mle:[92m -0.10404 [0m(-0.00012)
     | > avg_loss_dur:[91m 0.92976 [0m(+0.00119)


[4m[1m > EPOCH: 183/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 550[0m
     | > loss: 0.33527  (0.33527)
     | > log_mle: -0.03989  (-0.03989)
     | > loss_dur: 0.37516  (0.37516)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.51688  (3.51688)
     | > current_lr: 0.00005 
     | > step_time: 1.07500  (1.07498)
     | > loader_time: 0.43540  (0.43540)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.80777 [0m(-0.01795)
     | > avg_log_mle:[92m -0.10634 [0m(-0.00230)
     | > avg_loss_dur:[92m 0.91411 [0m(-0.01565)


[4m[1m > EPOCH: 184/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.73978 [0m(-0.06799)
     | > avg_log_mle:[92m -0.11169 [0m(-0.00535)
     | > avg_loss_dur:[92m 0.85148 [0m(-0.06263)


[4m[1m > EPOCH: 185/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.72477 [0m(-0.01502)
     | > avg_log_mle:[92m -0.11609 [0m(-0.00440)
     | > avg_loss_dur:[92m 0.84086 [0m(-0.01062)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_558.pth

[4m[1m > EPOCH: 186/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:54:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.72738 [0m(+0.00261)
     | > avg_log_mle:[91m -0.11543 [0m(+0.00066)
     | > avg_loss_dur:[91m 0.84281 [0m(+0.00195)


[4m[1m > EPOCH: 187/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.73904 [0m(+0.01166)
     | > avg_log_mle:[92m -0.12061 [0m(-0.00517)
     | > avg_loss_dur:[91m 0.85965 [0m(+0.01684)


[4m[1m > EPOCH: 188/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.72871 [0m(-0.01033)
     | > avg_log_mle:[92m -0.12510 [0m(-0.00449)
     | > avg_loss_dur:[92m 0.85381 [0m(-0.00584)


[4m[1m > EPOCH: 189/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.61461 [0m(-0.11410)
     | > avg_log_mle:[92m -0.12813 [0m(-0.00303)
     | > avg_loss_dur:[92m 0.74274 [0m(-0.11106)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_570.pth

[4m[1m > EPOCH: 190/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.72412 [0m(+0.10951)
     | > avg_log_mle:[92m -0.12921 [0m(-0.00108)
     | > avg_loss_dur:[91m 0.85333 [0m(+0.11059)


[4m[1m > EPOCH: 191/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 575[0m
     | > loss: 0.29276  (0.29731)
     | > log_mle: -0.13517  (-0.09815)
     | > loss_dur: 0.42793  (0.39546)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.27611  (2.18727)
     | > current_lr: 0.00005 
     | > step_time: 0.39540  (0.71765)
     | > loader_time: 0.10510  (0.26274)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.74863 [0m(+0.02451)
     | > avg_log_mle:[91m -0.12260 [0m(+0.00661)
     | > avg_loss_dur:[91m 0.87122 [0m(+0.01789)


[4m[1m > EPOCH: 192/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.72899 [0m(-0.01964)
     | > avg_log_mle:[92m -0.13136 [0m(-0.00876)
     | > avg_loss_dur:[92m 0.86034 [0m(-0.01088)


[4m[1m > EPOCH: 193/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:55:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.58679 [0m(-0.14220)
     | > avg_log_mle:[92m -0.13687 [0m(-0.00552)
     | > avg_loss_dur:[92m 0.72367 [0m(-0.13668)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_582.pth

[4m[1m > EPOCH: 194/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.67473 [0m(+0.08794)
     | > avg_log_mle:[91m -0.13463 [0m(+0.00224)
     | > avg_loss_dur:[91m 0.80936 [0m(+0.08570)


[4m[1m > EPOCH: 195/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.68054 [0m(+0.00581)
     | > avg_log_mle:[92m -0.13844 [0m(-0.00381)
     | > avg_loss_dur:[91m 0.81898 [0m(+0.00961)


[4m[1m > EPOCH: 196/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.64536 [0m(-0.03517)
     | > avg_log_mle:[92m -0.14398 [0m(-0.00554)
     | > avg_loss_dur:[92m 0.78934 [0m(-0.02963)


[4m[1m > EPOCH: 197/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.68925 [0m(+0.04389)
     | > avg_log_mle:[91m -0.14262 [0m(+0.00136)
     | > avg_loss_dur:[91m 0.83186 [0m(+0.04252)


[4m[1m > EPOCH: 198/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.67650 [0m(-0.01274)
     | > avg_log_mle:[91m -0.14131 [0m(+0.00130)
     | > avg_loss_dur:[92m 0.81782 [0m(-0.01405)


[4m[1m > EPOCH: 199/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.65923 [0m(-0.01727)
     | > avg_log_mle:[92m -0.15025 [0m(-0.00894)
     | > avg_loss_dur:[92m 0.80948 [0m(-0.00834)


[4m[1m > EPOCH: 200/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:56:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 600[0m
     | > loss: 0.20209  (0.20209)
     | > log_mle: -0.10729  (-0.10729)
     | > loss_dur: 0.30938  (0.30938)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.88347  (2.88347)
     | > current_lr: 0.00005 
     | > step_time: 0.76270  (0.76269)
     | > loader_time: 0.33030  (0.33030)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.54994 [0m(-0.10929)
     | > avg_log_mle:[92m -0.15216 [0m(-0.00191)
     | > avg_loss_dur:[92m 0.70210 [0m(-0.10738)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_603.pth

[4m[1m > EPOCH: 201/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.66938 [0m(+0.11944)
     | > avg_log_mle:[91m -0.14826 [0m(+0.00389)
     | > avg_loss_dur:[91m 0.81764 [0m(+0.11555)


[4m[1m > EPOCH: 202/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.65403 [0m(-0.01535)
     | > avg_log_mle:[92m -0.15318 [0m(-0.00492)
     | > avg_loss_dur:[92m 0.80722 [0m(-0.01043)


[4m[1m > EPOCH: 203/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.63193 [0m(-0.02210)
     | > avg_log_mle:[92m -0.15963 [0m(-0.00645)
     | > avg_loss_dur:[92m 0.79156 [0m(-0.01566)


[4m[1m > EPOCH: 204/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.62681 [0m(-0.00512)
     | > avg_log_mle:[92m -0.16094 [0m(-0.00131)
     | > avg_loss_dur:[92m 0.78775 [0m(-0.00381)


[4m[1m > EPOCH: 205/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.63108 [0m(+0.00427)
     | > avg_log_mle:[91m -0.15977 [0m(+0.00117)
     | > avg_loss_dur:[91m 0.79085 [0m(+0.00310)


[4m[1m > EPOCH: 206/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.58424 [0m(-0.04684)
     | > avg_log_mle:[92m -0.16517 [0m(-0.00540)
     | > avg_loss_dur:[92m 0.74941 [0m(-0.04144)


[4m[1m > EPOCH: 207/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:57:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.61941 [0m(+0.03517)
     | > avg_log_mle:[92m -0.16826 [0m(-0.00309)
     | > avg_loss_dur:[91m 0.78767 [0m(+0.03826)


[4m[1m > EPOCH: 208/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 625[0m
     | > loss: 0.23084  (0.23084)
     | > log_mle: -0.10499  (-0.10499)
     | > loss_dur: 0.33582  (0.33582)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.01384  (3.01384)
     | > current_lr: 0.00005 
     | > step_time: 1.03200  (1.03196)
     | > loader_time: 0.42740  (0.42739)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.59520 [0m(-0.02421)
     | > avg_log_mle:[91m -0.16821 [0m(+0.00005)
     | > avg_loss_dur:[92m 0.76342 [0m(-0.02425)


[4m[1m > EPOCH: 209/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.60376 [0m(+0.00856)
     | > avg_log_mle:[91m -0.16461 [0m(+0.00360)
     | > avg_loss_dur:[91m 0.76837 [0m(+0.00496)


[4m[1m > EPOCH: 210/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.59017 [0m(-0.01359)
     | > avg_log_mle:[92m -0.17231 [0m(-0.00769)
     | > avg_loss_dur:[92m 0.76248 [0m(-0.00590)


[4m[1m > EPOCH: 211/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.59812 [0m(+0.00795)
     | > avg_log_mle:[92m -0.17690 [0m(-0.00459)
     | > avg_loss_dur:[91m 0.77501 [0m(+0.01254)


[4m[1m > EPOCH: 212/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.55459 [0m(-0.04353)
     | > avg_log_mle:[92m -0.17989 [0m(-0.00300)
     | > avg_loss_dur:[92m 0.73448 [0m(-0.04053)


[4m[1m > EPOCH: 213/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.55302 [0m(-0.00156)
     | > avg_log_mle:[91m -0.17817 [0m(+0.00172)
     | > avg_loss_dur:[92m 0.73120 [0m(-0.00328)


[4m[1m > EPOCH: 214/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.57919 [0m(+0.02617)
     | > avg_log_mle:[92m -0.17900 [0m(-0.00082)
     | > avg_loss_dur:[91m 0.75819 [0m(+0.02699)


[4m[1m > EPOCH: 215/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:58:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.54871 [0m(-0.03048)
     | > avg_log_mle:[92m -0.17988 [0m(-0.00089)
     | > avg_loss_dur:[92m 0.72859 [0m(-0.02959)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_648.pth

[4m[1m > EPOCH: 216/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:59:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 650[0m
     | > loss: 0.17883  (0.19222)
     | > log_mle: -0.20524  (-0.16512)
     | > loss_dur: 0.38407  (0.35733)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.11580  (3.87304)
     | > current_lr: 0.00005 
     | > step_time: 0.39440  (0.71365)
     | > loader_time: 0.10510  (0.26323)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.58238 [0m(+0.03366)
     | > avg_log_mle:[92m -0.18674 [0m(-0.00686)
     | > avg_loss_dur:[91m 0.76912 [0m(+0.04052)


[4m[1m > EPOCH: 217/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:59:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.56649 [0m(-0.01589)
     | > avg_log_mle:[91m -0.18450 [0m(+0.00224)
     | > avg_loss_dur:[92m 0.75099 [0m(-0.01813)


[4m[1m > EPOCH: 218/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:59:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.56905 [0m(+0.00256)
     | > avg_log_mle:[91m -0.17808 [0m(+0.00642)
     | > avg_loss_dur:[92m 0.74712 [0m(-0.00386)


[4m[1m > EPOCH: 219/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:59:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.53066 [0m(-0.03839)
     | > avg_log_mle:[92m -0.18061 [0m(-0.00253)
     | > avg_loss_dur:[92m 0.71127 [0m(-0.03586)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_660.pth

[4m[1m > EPOCH: 220/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:59:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.55066 [0m(+0.02000)
     | > avg_log_mle:[92m -0.18898 [0m(-0.00837)
     | > avg_loss_dur:[91m 0.73964 [0m(+0.02837)


[4m[1m > EPOCH: 221/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 04:59:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.54580 [0m(-0.00486)
     | > avg_log_mle:[92m -0.19234 [0m(-0.00336)
     | > avg_loss_dur:[92m 0.73814 [0m(-0.00150)


[4m[1m > EPOCH: 222/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.54897 [0m(+0.00317)
     | > avg_log_mle:[92m -0.19295 [0m(-0.00061)
     | > avg_loss_dur:[91m 0.74192 [0m(+0.00378)


[4m[1m > EPOCH: 223/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.50261 [0m(-0.04637)
     | > avg_log_mle:[92m -0.19802 [0m(-0.00507)
     | > avg_loss_dur:[92m 0.70063 [0m(-0.04129)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_672.pth

[4m[1m > EPOCH: 224/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.51073 [0m(+0.00812)
     | > avg_log_mle:[91m -0.19695 [0m(+0.00107)
     | > avg_loss_dur:[91m 0.70768 [0m(+0.00705)


[4m[1m > EPOCH: 225/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 675[0m
     | > loss: 0.11858  (0.11858)
     | > log_mle: -0.16827  (-0.16827)
     | > loss_dur: 0.28685  (0.28685)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.77941  (5.77941)
     | > current_lr: 0.00006 
     | > step_time: 0.73370  (0.73367)
     | > loader_time: 0.31730  (0.31729)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.56206 [0m(+0.05134)
     | > avg_log_mle:[91m -0.19479 [0m(+0.00216)
     | > avg_loss_dur:[91m 0.75685 [0m(+0.04918)


[4m[1m > EPOCH: 226/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.51152 [0m(-0.05055)
     | > avg_log_mle:[92m -0.20158 [0m(-0.00679)
     | > avg_loss_dur:[92m 0.71310 [0m(-0.04376)


[4m[1m > EPOCH: 227/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.51349 [0m(+0.00198)
     | > avg_log_mle:[92m -0.20332 [0m(-0.00174)
     | > avg_loss_dur:[91m 0.71682 [0m(+0.00372)


[4m[1m > EPOCH: 228/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:00:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.53045 [0m(+0.01695)
     | > avg_log_mle:[91m -0.20219 [0m(+0.00113)
     | > avg_loss_dur:[91m 0.73264 [0m(+0.01582)


[4m[1m > EPOCH: 229/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:01:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.51332 [0m(-0.01713)
     | > avg_log_mle:[92m -0.20366 [0m(-0.00147)
     | > avg_loss_dur:[92m 0.71698 [0m(-0.01566)


[4m[1m > EPOCH: 230/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:01:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.46948 [0m(-0.04384)
     | > avg_log_mle:[92m -0.20966 [0m(-0.00599)
     | > avg_loss_dur:[92m 0.67914 [0m(-0.03784)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_693.pth

[4m[1m > EPOCH: 231/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:01:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.50077 [0m(+0.03129)
     | > avg_log_mle:[91m -0.20902 [0m(+0.00064)
     | > avg_loss_dur:[91m 0.70980 [0m(+0.03066)


[4m[1m > EPOCH: 232/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:01:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.45568 [0m(-0.04509)
     | > avg_log_mle:[92m -0.21295 [0m(-0.00393)
     | > avg_loss_dur:[92m 0.66863 [0m(-0.04117)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_699.pth

[4m[1m > EPOCH: 233/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:01:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 700[0m
     | > loss: 0.15975  (0.15975)
     | > log_mle: -0.16054  (-0.16054)
     | > loss_dur: 0.32029  (0.32029)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.01457  (6.01457)
     | > current_lr: 0.00006 
     | > step_time: 1.04190  (1.04195)
     | > loader_time: 0.41740  (0.41738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.51080 [0m(+0.05513)
     | > avg_log_mle:[91m -0.21237 [0m(+0.00058)
     | > avg_loss_dur:[91m 0.72318 [0m(+0.05455)


[4m[1m > EPOCH: 234/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:01:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.45305 [0m(-0.05775)
     | > avg_log_mle:[92m -0.21455 [0m(-0.00218)
     | > avg_loss_dur:[92m 0.66760 [0m(-0.05558)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_705.pth

[4m[1m > EPOCH: 235/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.46997 [0m(+0.01692)
     | > avg_log_mle:[92m -0.21587 [0m(-0.00132)
     | > avg_loss_dur:[91m 0.68584 [0m(+0.01824)


[4m[1m > EPOCH: 236/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.52023 [0m(+0.05026)
     | > avg_log_mle:[91m -0.21561 [0m(+0.00026)
     | > avg_loss_dur:[91m 0.73584 [0m(+0.04999)


[4m[1m > EPOCH: 237/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.46677 [0m(-0.05345)
     | > avg_log_mle:[91m -0.21452 [0m(+0.00109)
     | > avg_loss_dur:[92m 0.68130 [0m(-0.05454)


[4m[1m > EPOCH: 238/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.49905 [0m(+0.03228)
     | > avg_log_mle:[92m -0.21545 [0m(-0.00092)
     | > avg_loss_dur:[91m 0.71450 [0m(+0.03320)


[4m[1m > EPOCH: 239/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.47124 [0m(-0.02781)
     | > avg_log_mle:[92m -0.22266 [0m(-0.00721)
     | > avg_loss_dur:[92m 0.69390 [0m(-0.02060)


[4m[1m > EPOCH: 240/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.46847 [0m(-0.00277)
     | > avg_log_mle:[91m -0.22178 [0m(+0.00088)
     | > avg_loss_dur:[92m 0.69025 [0m(-0.00365)


[4m[1m > EPOCH: 241/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:02:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 725[0m
     | > loss: 0.11160  (0.12778)
     | > log_mle: -0.26055  (-0.21699)
     | > loss_dur: 0.37215  (0.34476)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.75779  (4.99054)
     | > current_lr: 0.00006 
     | > step_time: 0.41140  (0.72016)
     | > loader_time: 0.10010  (0.26173)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.45105 [0m(-0.01742)
     | > avg_log_mle:[92m -0.22203 [0m(-0.00025)
     | > avg_loss_dur:[92m 0.67307 [0m(-0.01718)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_726.pth

[4m[1m > EPOCH: 242/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:03:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.45449 [0m(+0.00345)
     | > avg_log_mle:[92m -0.22713 [0m(-0.00511)
     | > avg_loss_dur:[91m 0.68163 [0m(+0.00855)


[4m[1m > EPOCH: 243/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:03:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.46417 [0m(+0.00968)
     | > avg_log_mle:[91m -0.22376 [0m(+0.00338)
     | > avg_loss_dur:[91m 0.68793 [0m(+0.00630)


[4m[1m > EPOCH: 244/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:03:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.45394 [0m(-0.01023)
     | > avg_log_mle:[92m -0.22408 [0m(-0.00033)
     | > avg_loss_dur:[92m 0.67802 [0m(-0.00991)


[4m[1m > EPOCH: 245/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:03:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.44928 [0m(-0.00465)
     | > avg_log_mle:[92m -0.22907 [0m(-0.00498)
     | > avg_loss_dur:[91m 0.67835 [0m(+0.00033)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_738.pth

[4m[1m > EPOCH: 246/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:03:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.45057 [0m(+0.00129)
     | > avg_log_mle:[91m -0.22883 [0m(+0.00023)
     | > avg_loss_dur:[91m 0.67940 [0m(+0.00105)


[4m[1m > EPOCH: 247/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:03:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.42607 [0m(-0.02450)
     | > avg_log_mle:[92m -0.22966 [0m(-0.00083)
     | > avg_loss_dur:[92m 0.65573 [0m(-0.02368)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_744.pth

[4m[1m > EPOCH: 248/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:04:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.44542 [0m(+0.01935)
     | > avg_log_mle:[92m -0.23269 [0m(-0.00303)
     | > avg_loss_dur:[91m 0.67811 [0m(+0.02238)


[4m[1m > EPOCH: 249/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:04:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.43247 [0m(-0.01296)
     | > avg_log_mle:[92m -0.23961 [0m(-0.00692)
     | > avg_loss_dur:[92m 0.67208 [0m(-0.00603)


[4m[1m > EPOCH: 250/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:04:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 750[0m
     | > loss: 0.07121  (0.07121)
     | > log_mle: -0.21536  (-0.21536)
     | > loss_dur: 0.28657  (0.28657)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.80546  (2.80546)
     | > current_lr: 0.00006 
     | > step_time: 0.72770  (0.72766)
     | > loader_time: 0.32830  (0.32830)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.44200 [0m(+0.00954)
     | > avg_log_mle:[91m -0.23333 [0m(+0.00629)
     | > avg_loss_dur:[91m 0.67533 [0m(+0.00325)


[4m[1m > EPOCH: 251/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:04:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.47600 [0m(+0.03400)
     | > avg_log_mle:[91m -0.22947 [0m(+0.00386)
     | > avg_loss_dur:[91m 0.70547 [0m(+0.03014)


[4m[1m > EPOCH: 252/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:04:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.44746 [0m(-0.02854)
     | > avg_log_mle:[92m -0.23275 [0m(-0.00328)
     | > avg_loss_dur:[92m 0.68021 [0m(-0.02526)


[4m[1m > EPOCH: 253/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:04:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.49362 [0m(+0.04616)
     | > avg_log_mle:[91m -0.23197 [0m(+0.00078)
     | > avg_loss_dur:[91m 0.72559 [0m(+0.04538)


[4m[1m > EPOCH: 254/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.46956 [0m(-0.02406)
     | > avg_log_mle:[91m -0.23137 [0m(+0.00060)
     | > avg_loss_dur:[92m 0.70093 [0m(-0.02467)


[4m[1m > EPOCH: 255/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.41624 [0m(-0.05332)
     | > avg_log_mle:[92m -0.23980 [0m(-0.00843)
     | > avg_loss_dur:[92m 0.65604 [0m(-0.04489)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_768.pth

[4m[1m > EPOCH: 256/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.46643 [0m(+0.05019)
     | > avg_log_mle:[91m -0.23322 [0m(+0.00658)
     | > avg_loss_dur:[91m 0.69965 [0m(+0.04361)


[4m[1m > EPOCH: 257/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.47925 [0m(+0.01282)
     | > avg_log_mle:[92m -0.23323 [0m(-0.00001)
     | > avg_loss_dur:[91m 0.71248 [0m(+0.01283)


[4m[1m > EPOCH: 258/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 775[0m
     | > loss: 0.11976  (0.11976)
     | > log_mle: -0.19454  (-0.19454)
     | > loss_dur: 0.31431  (0.31431)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 9.51273  (9.51273)
     | > current_lr: 0.00006 
     | > step_time: 1.03990  (1.03995)
     | > loader_time: 0.42540  (0.42539)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.45388 [0m(-0.02537)
     | > avg_log_mle:[92m -0.23881 [0m(-0.00558)
     | > avg_loss_dur:[92m 0.69269 [0m(-0.01979)


[4m[1m > EPOCH: 259/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.42111 [0m(-0.03277)
     | > avg_log_mle:[92m -0.24424 [0m(-0.00543)
     | > avg_loss_dur:[92m 0.66534 [0m(-0.02735)


[4m[1m > EPOCH: 260/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:05:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.44210 [0m(+0.02099)
     | > avg_log_mle:[91m -0.24171 [0m(+0.00253)
     | > avg_loss_dur:[91m 0.68381 [0m(+0.01846)


[4m[1m > EPOCH: 261/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:06:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.35147 [0m(-0.09063)
     | > avg_log_mle:[91m -0.24122 [0m(+0.00049)
     | > avg_loss_dur:[92m 0.59269 [0m(-0.09112)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_786.pth

[4m[1m > EPOCH: 262/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:06:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.35739 [0m(+0.00592)
     | > avg_log_mle:[92m -0.24416 [0m(-0.00294)
     | > avg_loss_dur:[91m 0.60155 [0m(+0.00886)


[4m[1m > EPOCH: 263/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:06:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.46647 [0m(+0.10907)
     | > avg_log_mle:[91m -0.24002 [0m(+0.00414)
     | > avg_loss_dur:[91m 0.70648 [0m(+0.10494)


[4m[1m > EPOCH: 264/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:06:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.40665 [0m(-0.05981)
     | > avg_log_mle:[92m -0.24246 [0m(-0.00244)
     | > avg_loss_dur:[92m 0.64911 [0m(-0.05737)


[4m[1m > EPOCH: 265/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:06:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.50076 [0m(+0.09410)
     | > avg_log_mle:[91m -0.23707 [0m(+0.00539)
     | > avg_loss_dur:[91m 0.73783 [0m(+0.08872)


[4m[1m > EPOCH: 266/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:06:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 800[0m
     | > loss: 0.06310  (0.08315)
     | > log_mle: -0.29734  (-0.25058)
     | > loss_dur: 0.36044  (0.33373)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.41684  (8.14717)
     | > current_lr: 0.00007 
     | > step_time: 0.40040  (0.72367)
     | > loader_time: 0.10310  (0.26374)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.45392 [0m(-0.04683)
     | > avg_log_mle:[92m -0.24525 [0m(-0.00818)
     | > avg_loss_dur:[92m 0.69918 [0m(-0.03865)


[4m[1m > EPOCH: 267/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.45067 [0m(-0.00326)
     | > avg_log_mle:[92m -0.25209 [0m(-0.00684)
     | > avg_loss_dur:[91m 0.70276 [0m(+0.00358)


[4m[1m > EPOCH: 268/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.43671 [0m(-0.01395)
     | > avg_log_mle:[91m -0.24454 [0m(+0.00756)
     | > avg_loss_dur:[92m 0.68125 [0m(-0.02151)


[4m[1m > EPOCH: 269/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.40166 [0m(-0.03505)
     | > avg_log_mle:[92m -0.24788 [0m(-0.00335)
     | > avg_loss_dur:[92m 0.64955 [0m(-0.03170)


[4m[1m > EPOCH: 270/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.42652 [0m(+0.02486)
     | > avg_log_mle:[92m -0.25128 [0m(-0.00340)
     | > avg_loss_dur:[91m 0.67781 [0m(+0.02826)


[4m[1m > EPOCH: 271/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.36643 [0m(-0.06009)
     | > avg_log_mle:[91m -0.24533 [0m(+0.00596)
     | > avg_loss_dur:[92m 0.61175 [0m(-0.06605)


[4m[1m > EPOCH: 272/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.43964 [0m(+0.07321)
     | > avg_log_mle:[92m -0.25679 [0m(-0.01146)
     | > avg_loss_dur:[91m 0.69643 [0m(+0.08467)


[4m[1m > EPOCH: 273/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:07:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38113 [0m(-0.05851)
     | > avg_log_mle:[91m -0.24747 [0m(+0.00931)
     | > avg_loss_dur:[92m 0.62861 [0m(-0.06782)


[4m[1m > EPOCH: 274/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:08:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.45652 [0m(+0.07539)
     | > avg_log_mle:[91m -0.24677 [0m(+0.00070)
     | > avg_loss_dur:[91m 0.70329 [0m(+0.07468)


[4m[1m > EPOCH: 275/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:08:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 825[0m
     | > loss: 0.03926  (0.03926)
     | > log_mle: -0.23847  (-0.23847)
     | > loss_dur: 0.27773  (0.27773)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.69215  (14.69215)
     | > current_lr: 0.00007 
     | > step_time: 0.72570  (0.72566)
     | > loader_time: 0.33030  (0.33030)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.40964 [0m(-0.04688)
     | > avg_log_mle:[92m -0.25553 [0m(-0.00876)
     | > avg_loss_dur:[92m 0.66516 [0m(-0.03812)


[4m[1m > EPOCH: 276/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:08:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.44547 [0m(+0.03583)
     | > avg_log_mle:[91m -0.23501 [0m(+0.02051)
     | > avg_loss_dur:[91m 0.68048 [0m(+0.01532)


[4m[1m > EPOCH: 277/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:08:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.46162 [0m(+0.01615)
     | > avg_log_mle:[92m -0.24525 [0m(-0.01024)
     | > avg_loss_dur:[91m 0.70687 [0m(+0.02639)


[4m[1m > EPOCH: 278/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:08:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.43560 [0m(-0.02601)
     | > avg_log_mle:[91m -0.23623 [0m(+0.00902)
     | > avg_loss_dur:[92m 0.67184 [0m(-0.03503)


[4m[1m > EPOCH: 279/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:08:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.41535 [0m(-0.02025)
     | > avg_log_mle:[92m -0.26440 [0m(-0.02817)
     | > avg_loss_dur:[91m 0.67975 [0m(+0.00791)


[4m[1m > EPOCH: 280/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.45359 [0m(+0.03824)
     | > avg_log_mle:[91m -0.24863 [0m(+0.01577)
     | > avg_loss_dur:[91m 0.70222 [0m(+0.02247)


[4m[1m > EPOCH: 281/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.42332 [0m(-0.03027)
     | > avg_log_mle:[92m -0.25311 [0m(-0.00448)
     | > avg_loss_dur:[92m 0.67643 [0m(-0.02578)


[4m[1m > EPOCH: 282/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.38184 [0m(-0.04148)
     | > avg_log_mle:[91m -0.24951 [0m(+0.00360)
     | > avg_loss_dur:[92m 0.63135 [0m(-0.04508)


[4m[1m > EPOCH: 283/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 850[0m
     | > loss: 0.08570  (0.08570)
     | > log_mle: -0.22332  (-0.22332)
     | > loss_dur: 0.30903  (0.30903)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.86595  (13.86595)
     | > current_lr: 0.00007 
     | > step_time: 1.03290  (1.03294)
     | > loader_time: 0.42240  (0.42238)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.43928 [0m(+0.05743)
     | > avg_log_mle:[91m -0.23748 [0m(+0.01203)
     | > avg_loss_dur:[91m 0.67676 [0m(+0.04541)


[4m[1m > EPOCH: 284/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.46346 [0m(+0.02419)
     | > avg_log_mle:[92m -0.23954 [0m(-0.00206)
     | > avg_loss_dur:[91m 0.70301 [0m(+0.02625)


[4m[1m > EPOCH: 285/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.38813 [0m(-0.07534)
     | > avg_log_mle:[92m -0.25352 [0m(-0.01398)
     | > avg_loss_dur:[92m 0.64165 [0m(-0.06136)


[4m[1m > EPOCH: 286/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:09:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.43561 [0m(+0.04748)
     | > avg_log_mle:[91m -0.24181 [0m(+0.01172)
     | > avg_loss_dur:[91m 0.67742 [0m(+0.03577)


[4m[1m > EPOCH: 287/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:10:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.43621 [0m(+0.00060)
     | > avg_log_mle:[92m -0.26274 [0m(-0.02093)
     | > avg_loss_dur:[91m 0.69894 [0m(+0.02153)


[4m[1m > EPOCH: 288/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:10:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.39865 [0m(-0.03755)
     | > avg_log_mle:[91m -0.25371 [0m(+0.00903)
     | > avg_loss_dur:[92m 0.65236 [0m(-0.04659)


[4m[1m > EPOCH: 289/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:10:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.37306 [0m(-0.02559)
     | > avg_log_mle:[92m -0.26615 [0m(-0.01245)
     | > avg_loss_dur:[92m 0.63921 [0m(-0.01314)


[4m[1m > EPOCH: 290/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:10:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.40324 [0m(+0.03018)
     | > avg_log_mle:[92m -0.26816 [0m(-0.00200)
     | > avg_loss_dur:[91m 0.67140 [0m(+0.03218)


[4m[1m > EPOCH: 291/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:10:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 875[0m
     | > loss: 0.03019  (0.06034)
     | > log_mle: -0.32622  (-0.27696)
     | > loss_dur: 0.35641  (0.33730)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.38343  (10.34642)
     | > current_lr: 0.00007 
     | > step_time: 0.40040  (0.71849)
     | > loader_time: 0.10010  (0.26024)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.38234 [0m(-0.02091)
     | > avg_log_mle:[91m -0.26251 [0m(+0.00564)
     | > avg_loss_dur:[92m 0.64485 [0m(-0.02655)


[4m[1m > EPOCH: 292/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:10:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.43211 [0m(+0.04978)
     | > avg_log_mle:[92m -0.26988 [0m(-0.00736)
     | > avg_loss_dur:[91m 0.70199 [0m(+0.05714)


[4m[1m > EPOCH: 293/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.40328 [0m(-0.02884)
     | > avg_log_mle:[91m -0.26603 [0m(+0.00385)
     | > avg_loss_dur:[92m 0.66931 [0m(-0.03268)


[4m[1m > EPOCH: 294/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.39366 [0m(-0.00962)
     | > avg_log_mle:[92m -0.27440 [0m(-0.00837)
     | > avg_loss_dur:[92m 0.66806 [0m(-0.00125)


[4m[1m > EPOCH: 295/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35529 [0m(-0.03837)
     | > avg_log_mle:[91m -0.26979 [0m(+0.00460)
     | > avg_loss_dur:[92m 0.62508 [0m(-0.04297)


[4m[1m > EPOCH: 296/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.38731 [0m(+0.03202)
     | > avg_log_mle:[91m -0.26916 [0m(+0.00063)
     | > avg_loss_dur:[91m 0.65647 [0m(+0.03139)


[4m[1m > EPOCH: 297/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.40259 [0m(+0.01528)
     | > avg_log_mle:[91m -0.26164 [0m(+0.00753)
     | > avg_loss_dur:[91m 0.66423 [0m(+0.00776)


[4m[1m > EPOCH: 298/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.40129 [0m(-0.00130)
     | > avg_log_mle:[92m -0.27080 [0m(-0.00916)
     | > avg_loss_dur:[91m 0.67209 [0m(+0.00786)


[4m[1m > EPOCH: 299/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:11:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.40634 [0m(+0.00505)
     | > avg_log_mle:[91m -0.26995 [0m(+0.00084)
     | > avg_loss_dur:[91m 0.67629 [0m(+0.00421)


[4m[1m > EPOCH: 300/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:12:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 900[0m
     | > loss: 0.00821  (0.00821)
     | > log_mle: -0.26675  (-0.26675)
     | > loss_dur: 0.27495  (0.27495)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 21.33456  (21.33456)
     | > current_lr: 0.00007 
     | > step_time: 0.72570  (0.72567)
     | > loader_time: 0.31430  (0.31428)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.39403 [0m(-0.01231)
     | > avg_log_mle:[92m -0.27449 [0m(-0.00453)
     | > avg_loss_dur:[92m 0.66852 [0m(-0.00778)


[4m[1m > EPOCH: 301/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:12:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.42400 [0m(+0.02997)
     | > avg_log_mle:[91m -0.26257 [0m(+0.01192)
     | > avg_loss_dur:[91m 0.68657 [0m(+0.01805)


[4m[1m > EPOCH: 302/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:12:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.38164 [0m(-0.04235)
     | > avg_log_mle:[92m -0.27552 [0m(-0.01295)
     | > avg_loss_dur:[92m 0.65716 [0m(-0.02941)


[4m[1m > EPOCH: 303/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:12:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.39493 [0m(+0.01329)
     | > avg_log_mle:[91m -0.25057 [0m(+0.02495)
     | > avg_loss_dur:[92m 0.64550 [0m(-0.01166)


[4m[1m > EPOCH: 304/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:12:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.44243 [0m(+0.04750)
     | > avg_log_mle:[92m -0.26638 [0m(-0.01581)
     | > avg_loss_dur:[91m 0.70881 [0m(+0.06331)


[4m[1m > EPOCH: 305/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:12:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.41189 [0m(-0.03055)
     | > avg_log_mle:[91m -0.24619 [0m(+0.02019)
     | > avg_loss_dur:[92m 0.65808 [0m(-0.05073)


[4m[1m > EPOCH: 306/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:13:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.41157 [0m(-0.00031)
     | > avg_log_mle:[92m -0.26444 [0m(-0.01825)
     | > avg_loss_dur:[91m 0.67601 [0m(+0.01794)


[4m[1m > EPOCH: 307/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:13:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.42602 [0m(+0.01444)
     | > avg_log_mle:[91m -0.25979 [0m(+0.00465)
     | > avg_loss_dur:[91m 0.68581 [0m(+0.00979)


[4m[1m > EPOCH: 308/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:13:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 925[0m
     | > loss: 0.09038  (0.09038)
     | > log_mle: -0.23138  (-0.23138)
     | > loss_dur: 0.32175  (0.32175)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 20.05393  (20.05393)
     | > current_lr: 0.00008 
     | > step_time: 1.03490  (1.03494)
     | > loader_time: 0.42140  (0.42138)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.37353 [0m(-0.05248)
     | > avg_log_mle:[91m -0.24755 [0m(+0.01225)
     | > avg_loss_dur:[92m 0.62108 [0m(-0.06473)


[4m[1m > EPOCH: 309/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:13:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39154 [0m(+0.01800)
     | > avg_log_mle:[92m -0.27054 [0m(-0.02299)
     | > avg_loss_dur:[91m 0.66207 [0m(+0.04099)


[4m[1m > EPOCH: 310/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:13:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36381 [0m(-0.02772)
     | > avg_log_mle:[92m -0.27122 [0m(-0.00068)
     | > avg_loss_dur:[92m 0.63503 [0m(-0.02704)


[4m[1m > EPOCH: 311/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:13:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.44068 [0m(+0.07686)
     | > avg_log_mle:[92m -0.27155 [0m(-0.00033)
     | > avg_loss_dur:[91m 0.71223 [0m(+0.07720)


[4m[1m > EPOCH: 312/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.39155 [0m(-0.04913)
     | > avg_log_mle:[92m -0.28243 [0m(-0.01088)
     | > avg_loss_dur:[92m 0.67398 [0m(-0.03825)


[4m[1m > EPOCH: 313/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[91m 0.41002 [0m(+0.01847)
     | > avg_log_mle:[91m -0.27102 [0m(+0.01141)
     | > avg_loss_dur:[91m 0.68104 [0m(+0.00706)


[4m[1m > EPOCH: 314/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.41405 [0m(+0.00403)
     | > avg_log_mle:[92m -0.28445 [0m(-0.01344)
     | > avg_loss_dur:[91m 0.69850 [0m(+0.01746)


[4m[1m > EPOCH: 315/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.42416 [0m(+0.01012)
     | > avg_log_mle:[91m -0.28125 [0m(+0.00321)
     | > avg_loss_dur:[91m 0.70541 [0m(+0.00691)


[4m[1m > EPOCH: 316/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 950[0m
     | > loss: 0.00547  (0.03025)
     | > log_mle: -0.35229  (-0.30107)
     | > loss_dur: 0.35775  (0.33132)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.90671  (11.91228)
     | > current_lr: 0.00008 
     | > step_time: 0.40440  (0.71716)
     | > loader_time: 0.10810  (0.26473)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.41512 [0m(-0.00904)
     | > avg_log_mle:[92m -0.28504 [0m(-0.00380)
     | > avg_loss_dur:[92m 0.70017 [0m(-0.00524)


[4m[1m > EPOCH: 317/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.39778 [0m(-0.01735)
     | > avg_log_mle:[91m -0.28129 [0m(+0.00376)
     | > avg_loss_dur:[92m 0.67906 [0m(-0.02110)


[4m[1m > EPOCH: 318/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:14:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36545 [0m(-0.03233)
     | > avg_log_mle:[92m -0.28787 [0m(-0.00659)
     | > avg_loss_dur:[92m 0.65332 [0m(-0.02574)


[4m[1m > EPOCH: 319/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:15:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.43042 [0m(+0.06497)
     | > avg_log_mle:[91m -0.27997 [0m(+0.00791)
     | > avg_loss_dur:[91m 0.71039 [0m(+0.05707)


[4m[1m > EPOCH: 320/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:15:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38067 [0m(-0.04976)
     | > avg_log_mle:[92m -0.28885 [0m(-0.00888)
     | > avg_loss_dur:[92m 0.66952 [0m(-0.04087)


[4m[1m > EPOCH: 321/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:15:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.35089 [0m(-0.02978)
     | > avg_log_mle:[91m -0.27855 [0m(+0.01030)
     | > avg_loss_dur:[92m 0.62943 [0m(-0.04008)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_966.pth

[4m[1m > EPOCH: 322/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:15:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.38572 [0m(+0.03483)
     | > avg_log_mle:[91m -0.27795 [0m(+0.00060)
     | > avg_loss_dur:[91m 0.66367 [0m(+0.03424)


[4m[1m > EPOCH: 323/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:15:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35433 [0m(-0.03139)
     | > avg_log_mle:[92m -0.27917 [0m(-0.00122)
     | > avg_loss_dur:[92m 0.63350 [0m(-0.03017)


[4m[1m > EPOCH: 324/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:15:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.44593 [0m(+0.09160)
     | > avg_log_mle:[92m -0.28332 [0m(-0.00415)
     | > avg_loss_dur:[91m 0.72925 [0m(+0.09575)


[4m[1m > EPOCH: 325/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 975[0m
     | > loss: -0.01277  (-0.01277)
     | > log_mle: -0.28834  (-0.28834)
     | > loss_dur: 0.27557  (0.27557)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.27302  (11.27302)
     | > current_lr: 0.00008 
     | > step_time: 0.72570  (0.72566)
     | > loader_time: 0.32830  (0.32829)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.41622 [0m(-0.02970)
     | > avg_log_mle:[91m -0.26834 [0m(+0.01498)
     | > avg_loss_dur:[92m 0.68457 [0m(-0.04468)


[4m[1m > EPOCH: 326/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36105 [0m(-0.05517)
     | > avg_log_mle:[92m -0.28746 [0m(-0.01912)
     | > avg_loss_dur:[92m 0.64851 [0m(-0.03606)


[4m[1m > EPOCH: 327/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39644 [0m(+0.03540)
     | > avg_log_mle:[91m -0.28453 [0m(+0.00293)
     | > avg_loss_dur:[91m 0.68098 [0m(+0.03247)


[4m[1m > EPOCH: 328/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.42431 [0m(+0.02787)
     | > avg_log_mle:[91m -0.27972 [0m(+0.00481)
     | > avg_loss_dur:[91m 0.70403 [0m(+0.02306)


[4m[1m > EPOCH: 329/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.43983 [0m(+0.01552)
     | > avg_log_mle:[92m -0.29117 [0m(-0.01145)
     | > avg_loss_dur:[91m 0.73100 [0m(+0.02697)


[4m[1m > EPOCH: 330/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.37730 [0m(-0.06253)
     | > avg_log_mle:[91m -0.28432 [0m(+0.00685)
     | > avg_loss_dur:[92m 0.66162 [0m(-0.06939)


[4m[1m > EPOCH: 331/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:16:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39871 [0m(+0.02141)
     | > avg_log_mle:[92m -0.28678 [0m(-0.00246)
     | > avg_loss_dur:[91m 0.68549 [0m(+0.02387)


[4m[1m > EPOCH: 332/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:17:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.44128 [0m(+0.04257)
     | > avg_log_mle:[91m -0.27070 [0m(+0.01608)
     | > avg_loss_dur:[91m 0.71198 [0m(+0.02650)


[4m[1m > EPOCH: 333/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:17:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1000[0m
     | > loss: 0.04547  (0.04547)
     | > log_mle: -0.26283  (-0.26283)
     | > loss_dur: 0.30829  (0.30829)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.96669  (12.96669)
     | > current_lr: 0.00008 
     | > step_time: 1.03690  (1.03694)
     | > loader_time: 0.41940  (0.41938)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.41300 [0m(-0.02828)
     | > avg_log_mle:[92m -0.28916 [0m(-0.01846)
     | > avg_loss_dur:[92m 0.70216 [0m(-0.00983)


[4m[1m > EPOCH: 334/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:17:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 0.36716 [0m(-0.04584)
     | > avg_log_mle:[91m -0.28015 [0m(+0.00901)
     | > avg_loss_dur:[92m 0.64731 [0m(-0.05485)


[4m[1m > EPOCH: 335/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:17:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[91m 0.38212 [0m(+0.01496)
     | > avg_log_mle:[92m -0.28967 [0m(-0.00953)
     | > avg_loss_dur:[91m 0.67179 [0m(+0.02448)


[4m[1m > EPOCH: 336/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:17:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.37060 [0m(-0.01152)
     | > avg_log_mle:[91m -0.28092 [0m(+0.00876)
     | > avg_loss_dur:[92m 0.65152 [0m(-0.02027)


[4m[1m > EPOCH: 337/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:17:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.40518 [0m(+0.03458)
     | > avg_log_mle:[91m -0.27823 [0m(+0.00268)
     | > avg_loss_dur:[91m 0.68341 [0m(+0.03189)


[4m[1m > EPOCH: 338/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36710 [0m(-0.03808)
     | > avg_log_mle:[92m -0.29875 [0m(-0.02051)
     | > avg_loss_dur:[92m 0.66584 [0m(-0.01757)


[4m[1m > EPOCH: 339/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41102 [0m(+0.04392)
     | > avg_log_mle:[91m -0.28152 [0m(+0.01723)
     | > avg_loss_dur:[91m 0.69254 [0m(+0.02669)


[4m[1m > EPOCH: 340/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.38890 [0m(-0.02211)
     | > avg_log_mle:[92m -0.29837 [0m(-0.01686)
     | > avg_loss_dur:[92m 0.68728 [0m(-0.00526)


[4m[1m > EPOCH: 341/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1025[0m
     | > loss: -0.01181  (0.01157)
     | > log_mle: -0.37521  (-0.32405)
     | > loss_dur: 0.36340  (0.33562)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 25.24241  (20.82376)
     | > current_lr: 0.00009 
     | > step_time: 0.40440  (0.71915)
     | > loader_time: 0.10410  (0.26124)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.41876 [0m(+0.02986)
     | > avg_log_mle:[91m -0.29158 [0m(+0.00679)
     | > avg_loss_dur:[91m 0.71034 [0m(+0.02306)


[4m[1m > EPOCH: 342/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.40112 [0m(-0.01764)
     | > avg_log_mle:[92m -0.29257 [0m(-0.00099)
     | > avg_loss_dur:[92m 0.69369 [0m(-0.01665)


[4m[1m > EPOCH: 343/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.40743 [0m(+0.00631)
     | > avg_log_mle:[91m -0.29230 [0m(+0.00027)
     | > avg_loss_dur:[91m 0.69972 [0m(+0.00603)


[4m[1m > EPOCH: 344/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:18:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.37136 [0m(-0.03607)
     | > avg_log_mle:[92m -0.29250 [0m(-0.00020)
     | > avg_loss_dur:[92m 0.66385 [0m(-0.03587)


[4m[1m > EPOCH: 345/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:19:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 0.36521 [0m(-0.00614)
     | > avg_log_mle:[92m -0.29840 [0m(-0.00590)
     | > avg_loss_dur:[92m 0.66361 [0m(-0.00025)


[4m[1m > EPOCH: 346/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:19:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41220 [0m(+0.04699)
     | > avg_log_mle:[91m -0.28649 [0m(+0.01191)
     | > avg_loss_dur:[91m 0.69869 [0m(+0.03508)


[4m[1m > EPOCH: 347/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:19:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41117 [0m(-0.00103)
     | > avg_log_mle:[92m -0.30144 [0m(-0.01495)
     | > avg_loss_dur:[91m 0.71261 [0m(+0.01392)


[4m[1m > EPOCH: 348/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:19:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.35082 [0m(-0.06035)
     | > avg_log_mle:[91m -0.29613 [0m(+0.00531)
     | > avg_loss_dur:[92m 0.64695 [0m(-0.06566)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1047.pth

[4m[1m > EPOCH: 349/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:19:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.39517 [0m(+0.04435)
     | > avg_log_mle:[92m -0.30058 [0m(-0.00445)
     | > avg_loss_dur:[91m 0.69575 [0m(+0.04880)


[4m[1m > EPOCH: 350/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:19:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1050[0m
     | > loss: -0.03393  (-0.03393)
     | > log_mle: -0.30969  (-0.30969)
     | > loss_dur: 0.27577  (0.27577)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.27832  (10.27832)
     | > current_lr: 0.00009 
     | > step_time: 0.72670  (0.72666)
     | > loader_time: 0.31730  (0.31729)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.41094 [0m(+0.01576)
     | > avg_log_mle:[91m -0.29666 [0m(+0.00391)
     | > avg_loss_dur:[91m 0.70760 [0m(+0.01185)


[4m[1m > EPOCH: 351/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.41423 [0m(+0.00329)
     | > avg_log_mle:[92m -0.30265 [0m(-0.00599)
     | > avg_loss_dur:[91m 0.71688 [0m(+0.00928)


[4m[1m > EPOCH: 352/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.39060 [0m(-0.02363)
     | > avg_log_mle:[92m -0.30329 [0m(-0.00064)
     | > avg_loss_dur:[92m 0.69389 [0m(-0.02299)


[4m[1m > EPOCH: 353/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.39957 [0m(+0.00898)
     | > avg_log_mle:[91m -0.30087 [0m(+0.00242)
     | > avg_loss_dur:[91m 0.70044 [0m(+0.00655)


[4m[1m > EPOCH: 354/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.41923 [0m(+0.01966)
     | > avg_log_mle:[91m -0.29441 [0m(+0.00646)
     | > avg_loss_dur:[91m 0.71365 [0m(+0.01320)


[4m[1m > EPOCH: 355/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37607 [0m(-0.04317)
     | > avg_log_mle:[92m -0.30263 [0m(-0.00822)
     | > avg_loss_dur:[92m 0.67870 [0m(-0.03495)


[4m[1m > EPOCH: 356/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.42070 [0m(+0.04463)
     | > avg_log_mle:[91m -0.30193 [0m(+0.00071)
     | > avg_loss_dur:[91m 0.72263 [0m(+0.04393)


[4m[1m > EPOCH: 357/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:20:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.38971 [0m(-0.03099)
     | > avg_log_mle:[92m -0.30476 [0m(-0.00284)
     | > avg_loss_dur:[92m 0.69447 [0m(-0.02816)


[4m[1m > EPOCH: 358/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:21:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1075[0m
     | > loss: 0.02276  (0.02276)
     | > log_mle: -0.28296  (-0.28296)
     | > loss_dur: 0.30572  (0.30572)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.66638  (19.66638)
     | > current_lr: 0.00009 
     | > step_time: 1.04100  (1.04096)
     | > loader_time: 0.43940  (0.43939)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.39988 [0m(+0.01017)
     | > avg_log_mle:[91m -0.30345 [0m(+0.00132)
     | > avg_loss_dur:[91m 0.70333 [0m(+0.00885)


[4m[1m > EPOCH: 359/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:21:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.40687 [0m(+0.00699)
     | > avg_log_mle:[92m -0.30437 [0m(-0.00093)
     | > avg_loss_dur:[91m 0.71124 [0m(+0.00791)


[4m[1m > EPOCH: 360/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:21:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.36705 [0m(-0.03982)
     | > avg_log_mle:[91m -0.29771 [0m(+0.00667)
     | > avg_loss_dur:[92m 0.66476 [0m(-0.04648)


[4m[1m > EPOCH: 361/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:21:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.37183 [0m(+0.00478)
     | > avg_log_mle:[92m -0.30462 [0m(-0.00691)
     | > avg_loss_dur:[91m 0.67645 [0m(+0.01169)


[4m[1m > EPOCH: 362/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:21:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41708 [0m(+0.04525)
     | > avg_log_mle:[91m -0.30137 [0m(+0.00325)
     | > avg_loss_dur:[91m 0.71845 [0m(+0.04200)


[4m[1m > EPOCH: 363/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:21:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.37747 [0m(-0.03961)
     | > avg_log_mle:[92m -0.30535 [0m(-0.00398)
     | > avg_loss_dur:[92m 0.68282 [0m(-0.03562)


[4m[1m > EPOCH: 364/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.38503 [0m(+0.00756)
     | > avg_log_mle:[91m -0.30243 [0m(+0.00292)
     | > avg_loss_dur:[91m 0.68746 [0m(+0.00464)


[4m[1m > EPOCH: 365/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39085 [0m(+0.00582)
     | > avg_log_mle:[91m -0.30129 [0m(+0.00114)
     | > avg_loss_dur:[91m 0.69215 [0m(+0.00468)


[4m[1m > EPOCH: 366/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1100[0m
     | > loss: -0.04327  (-0.00857)
     | > log_mle: -0.40069  (-0.34441)
     | > loss_dur: 0.35742  (0.33584)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.17171  (13.53457)
     | > current_lr: 0.00009 
     | > step_time: 0.40240  (0.72016)
     | > loader_time: 0.10110  (0.25773)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.41143 [0m(+0.02058)
     | > avg_log_mle:[92m -0.30698 [0m(-0.00568)
     | > avg_loss_dur:[91m 0.71841 [0m(+0.02626)


[4m[1m > EPOCH: 367/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.39430 [0m(-0.01713)
     | > avg_log_mle:[91m -0.30158 [0m(+0.00539)
     | > avg_loss_dur:[92m 0.69588 [0m(-0.02253)


[4m[1m > EPOCH: 368/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.42334 [0m(+0.02904)
     | > avg_log_mle:[91m -0.28759 [0m(+0.01400)
     | > avg_loss_dur:[91m 0.71093 [0m(+0.01504)


[4m[1m > EPOCH: 369/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.39731 [0m(-0.02603)
     | > avg_log_mle:[92m -0.29620 [0m(-0.00861)
     | > avg_loss_dur:[92m 0.69351 [0m(-0.01742)


[4m[1m > EPOCH: 370/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:22:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.35014 [0m(-0.04717)
     | > avg_log_mle:[92m -0.30878 [0m(-0.01258)
     | > avg_loss_dur:[92m 0.65892 [0m(-0.03459)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1113.pth

[4m[1m > EPOCH: 371/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:23:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.37732 [0m(+0.02718)
     | > avg_log_mle:[91m -0.30814 [0m(+0.00064)
     | > avg_loss_dur:[91m 0.68546 [0m(+0.02654)


[4m[1m > EPOCH: 372/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:23:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.38910 [0m(+0.01178)
     | > avg_log_mle:[92m -0.31166 [0m(-0.00352)
     | > avg_loss_dur:[91m 0.70075 [0m(+0.01530)


[4m[1m > EPOCH: 373/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:23:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[91m 0.39283 [0m(+0.00373)
     | > avg_log_mle:[91m -0.30759 [0m(+0.00407)
     | > avg_loss_dur:[92m 0.70042 [0m(-0.00034)


[4m[1m > EPOCH: 374/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:23:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[92m 0.38792 [0m(-0.00491)
     | > avg_log_mle:[92m -0.30866 [0m(-0.00108)
     | > avg_loss_dur:[92m 0.69658 [0m(-0.00384)


[4m[1m > EPOCH: 375/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:23:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1125[0m
     | > loss: -0.05238  (-0.05238)
     | > log_mle: -0.32800  (-0.32800)
     | > loss_dur: 0.27563  (0.27563)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 18.73853  (18.73853)
     | > current_lr: 0.00009 
     | > step_time: 0.73070  (0.73067)
     | > loader_time: 0.31730  (0.31729)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39741 [0m(+0.00950)
     | > avg_log_mle:[91m -0.29301 [0m(+0.01565)
     | > avg_loss_dur:[92m 0.69043 [0m(-0.00615)


[4m[1m > EPOCH: 376/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:23:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[91m 0.43351 [0m(+0.03610)
     | > avg_log_mle:[91m -0.28591 [0m(+0.00710)
     | > avg_loss_dur:[91m 0.71942 [0m(+0.02900)


[4m[1m > EPOCH: 377/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[91m 0.44184 [0m(+0.00833)
     | > avg_log_mle:[91m -0.25080 [0m(+0.03512)
     | > avg_loss_dur:[92m 0.69264 [0m(-0.02678)


[4m[1m > EPOCH: 378/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.45958 [0m(+0.01774)
     | > avg_log_mle:[92m -0.25428 [0m(-0.00348)
     | > avg_loss_dur:[91m 0.71386 [0m(+0.02122)


[4m[1m > EPOCH: 379/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.43933 [0m(-0.02025)
     | > avg_log_mle:[92m -0.25471 [0m(-0.00043)
     | > avg_loss_dur:[92m 0.69404 [0m(-0.01982)


[4m[1m > EPOCH: 380/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.43632 [0m(-0.00300)
     | > avg_log_mle:[92m -0.25718 [0m(-0.00247)
     | > avg_loss_dur:[92m 0.69350 [0m(-0.00054)


[4m[1m > EPOCH: 381/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38808 [0m(-0.04824)
     | > avg_log_mle:[92m -0.26976 [0m(-0.01258)
     | > avg_loss_dur:[92m 0.65784 [0m(-0.03566)


[4m[1m > EPOCH: 382/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.35829 [0m(-0.02980)
     | > avg_log_mle:[92m -0.28441 [0m(-0.01465)
     | > avg_loss_dur:[92m 0.64270 [0m(-0.01514)


[4m[1m > EPOCH: 383/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:24:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1150[0m
     | > loss: 0.03669  (0.03669)
     | > log_mle: -0.28079  (-0.28079)
     | > loss_dur: 0.31748  (0.31748)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 16.42880  (16.42880)
     | > current_lr: 0.00010 
     | > step_time: 1.03490  (1.03494)
     | > loader_time: 0.42240  (0.42238)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.46824 [0m(+0.10995)
     | > avg_log_mle:[91m -0.25850 [0m(+0.02591)
     | > avg_loss_dur:[91m 0.72674 [0m(+0.08404)


[4m[1m > EPOCH: 384/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:25:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.40299 [0m(-0.06525)
     | > avg_log_mle:[92m -0.28730 [0m(-0.02880)
     | > avg_loss_dur:[92m 0.69028 [0m(-0.03646)


[4m[1m > EPOCH: 385/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:25:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41104 [0m(+0.00806)
     | > avg_log_mle:[92m -0.29042 [0m(-0.00312)
     | > avg_loss_dur:[91m 0.70146 [0m(+0.01118)


[4m[1m > EPOCH: 386/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:25:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.37169 [0m(-0.03935)
     | > avg_log_mle:[92m -0.30213 [0m(-0.01172)
     | > avg_loss_dur:[92m 0.67382 [0m(-0.02764)


[4m[1m > EPOCH: 387/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:25:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.40283 [0m(+0.03113)
     | > avg_log_mle:[92m -0.30311 [0m(-0.00098)
     | > avg_loss_dur:[91m 0.70593 [0m(+0.03211)


[4m[1m > EPOCH: 388/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:25:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.38022 [0m(-0.02261)
     | > avg_log_mle:[91m -0.28757 [0m(+0.01554)
     | > avg_loss_dur:[92m 0.66779 [0m(-0.03814)


[4m[1m > EPOCH: 389/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:25:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.37327 [0m(-0.00695)
     | > avg_log_mle:[92m -0.30196 [0m(-0.01439)
     | > avg_loss_dur:[91m 0.67523 [0m(+0.00744)


[4m[1m > EPOCH: 390/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.41508 [0m(+0.04182)
     | > avg_log_mle:[92m -0.30409 [0m(-0.00213)
     | > avg_loss_dur:[91m 0.71917 [0m(+0.04395)


[4m[1m > EPOCH: 391/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1175[0m
     | > loss: -0.04867  (-0.01000)
     | > log_mle: -0.40610  (-0.34988)
     | > loss_dur: 0.35743  (0.33989)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 12.94874  (20.55795)
     | > current_lr: 0.00010 
     | > step_time: 0.40340  (0.71966)
     | > loader_time: 0.10610  (0.26173)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.39557 [0m(-0.01952)
     | > avg_log_mle:[92m -0.31049 [0m(-0.00640)
     | > avg_loss_dur:[92m 0.70606 [0m(-0.01311)


[4m[1m > EPOCH: 392/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.42777 [0m(+0.03220)
     | > avg_log_mle:[91m -0.29223 [0m(+0.01826)
     | > avg_loss_dur:[91m 0.72000 [0m(+0.01395)


[4m[1m > EPOCH: 393/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.49966 [0m(+0.07188)
     | > avg_log_mle:[91m -0.23859 [0m(+0.05364)
     | > avg_loss_dur:[91m 0.73825 [0m(+0.01824)


[4m[1m > EPOCH: 394/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 0.41485 [0m(-0.08481)
     | > avg_log_mle:[92m -0.26852 [0m(-0.02993)
     | > avg_loss_dur:[92m 0.68337 [0m(-0.05487)


[4m[1m > EPOCH: 395/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41339 [0m(-0.00146)
     | > avg_log_mle:[92m -0.29511 [0m(-0.02659)
     | > avg_loss_dur:[91m 0.70850 [0m(+0.02513)


[4m[1m > EPOCH: 396/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:26:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.46379 [0m(+0.05040)
     | > avg_log_mle:[91m -0.28273 [0m(+0.01238)
     | > avg_loss_dur:[91m 0.74653 [0m(+0.03803)


[4m[1m > EPOCH: 397/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:27:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.40432 [0m(-0.05948)
     | > avg_log_mle:[92m -0.30929 [0m(-0.02655)
     | > avg_loss_dur:[92m 0.71361 [0m(-0.03292)


[4m[1m > EPOCH: 398/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:27:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.40145 [0m(-0.00287)
     | > avg_log_mle:[91m -0.28268 [0m(+0.02661)
     | > avg_loss_dur:[92m 0.68413 [0m(-0.02947)


[4m[1m > EPOCH: 399/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:27:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.38585 [0m(-0.01560)
     | > avg_log_mle:[92m -0.31292 [0m(-0.03024)
     | > avg_loss_dur:[91m 0.69877 [0m(+0.01463)


[4m[1m > EPOCH: 400/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:27:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1200[0m
     | > loss: -0.05520  (-0.05520)
     | > log_mle: -0.32929  (-0.32929)
     | > loss_dur: 0.27408  (0.27408)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 21.46383  (21.46383)
     | > current_lr: 0.00010 
     | > step_time: 0.72970  (0.72967)
     | > loader_time: 0.32730  (0.32730)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.36674 [0m(-0.01911)
     | > avg_log_mle:[91m -0.31211 [0m(+0.00081)
     | > avg_loss_dur:[92m 0.67885 [0m(-0.01992)


[4m[1m > EPOCH: 401/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:27:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.40394 [0m(+0.03720)
     | > avg_log_mle:[91m -0.30531 [0m(+0.00680)
     | > avg_loss_dur:[91m 0.70925 [0m(+0.03040)


[4m[1m > EPOCH: 402/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:27:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.42358 [0m(+0.01964)
     | > avg_log_mle:[92m -0.31081 [0m(-0.00550)
     | > avg_loss_dur:[91m 0.73439 [0m(+0.02514)


[4m[1m > EPOCH: 403/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.35419 [0m(-0.06939)
     | > avg_log_mle:[91m -0.30616 [0m(+0.00465)
     | > avg_loss_dur:[92m 0.66035 [0m(-0.07404)


[4m[1m > EPOCH: 404/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.41857 [0m(+0.06438)
     | > avg_log_mle:[91m -0.30145 [0m(+0.00470)
     | > avg_loss_dur:[91m 0.72002 [0m(+0.05968)


[4m[1m > EPOCH: 405/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[92m 0.39793 [0m(-0.02064)
     | > avg_log_mle:[92m -0.31339 [0m(-0.01194)
     | > avg_loss_dur:[92m 0.71132 [0m(-0.00870)


[4m[1m > EPOCH: 406/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.51351 [0m(+0.11558)
     | > avg_log_mle:[91m -0.28902 [0m(+0.02437)
     | > avg_loss_dur:[91m 0.80253 [0m(+0.09121)


[4m[1m > EPOCH: 407/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.40992 [0m(-0.10359)
     | > avg_log_mle:[92m -0.31601 [0m(-0.02699)
     | > avg_loss_dur:[92m 0.72594 [0m(-0.07660)


[4m[1m > EPOCH: 408/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1225[0m
     | > loss: 0.01132  (0.01132)
     | > log_mle: -0.30228  (-0.30228)
     | > loss_dur: 0.31360  (0.31360)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 11.72146  (11.72146)
     | > current_lr: 0.00010 
     | > step_time: 1.03200  (1.03195)
     | > loader_time: 0.42240  (0.42238)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.42048 [0m(+0.01055)
     | > avg_log_mle:[91m -0.30868 [0m(+0.00734)
     | > avg_loss_dur:[91m 0.72915 [0m(+0.00322)


[4m[1m > EPOCH: 409/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:28:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.39949 [0m(-0.02098)
     | > avg_log_mle:[92m -0.31222 [0m(-0.00354)
     | > avg_loss_dur:[92m 0.71171 [0m(-0.01744)


[4m[1m > EPOCH: 410/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:29:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36072 [0m(-0.03878)
     | > avg_log_mle:[91m -0.29622 [0m(+0.01600)
     | > avg_loss_dur:[92m 0.65694 [0m(-0.05478)


[4m[1m > EPOCH: 411/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:29:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.42140 [0m(+0.06068)
     | > avg_log_mle:[91m -0.29510 [0m(+0.00112)
     | > avg_loss_dur:[91m 0.71650 [0m(+0.05956)


[4m[1m > EPOCH: 412/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:29:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41956 [0m(-0.00184)
     | > avg_log_mle:[91m -0.28784 [0m(+0.00726)
     | > avg_loss_dur:[92m 0.70739 [0m(-0.00911)


[4m[1m > EPOCH: 413/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:29:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.38870 [0m(-0.03086)
     | > avg_log_mle:[92m -0.30716 [0m(-0.01933)
     | > avg_loss_dur:[92m 0.69586 [0m(-0.01154)


[4m[1m > EPOCH: 414/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:29:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.54644 [0m(+0.15775)
     | > avg_log_mle:[91m -0.26558 [0m(+0.04158)
     | > avg_loss_dur:[91m 0.81202 [0m(+0.11616)


[4m[1m > EPOCH: 415/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:29:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.37949 [0m(-0.16695)
     | > avg_log_mle:[92m -0.31827 [0m(-0.05269)
     | > avg_loss_dur:[92m 0.69776 [0m(-0.11426)


[4m[1m > EPOCH: 416/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1250[0m
     | > loss: -0.07286  (-0.03868)
     | > log_mle: -0.42544  (-0.36974)
     | > loss_dur: 0.35258  (0.33106)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 17.75146  (15.58634)
     | > current_lr: 0.00010 
     | > step_time: 0.40140  (0.72015)
     | > loader_time: 0.10210  (0.25773)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00801 [0m(+0.00000)
     | > avg_loss:[91m 0.40593 [0m(+0.02643)
     | > avg_log_mle:[91m -0.29886 [0m(+0.01941)
     | > avg_loss_dur:[91m 0.70478 [0m(+0.00702)


[4m[1m > EPOCH: 417/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00400)
     | > avg_loss:[91m 0.44961 [0m(+0.04368)
     | > avg_log_mle:[92m -0.31169 [0m(-0.01283)
     | > avg_loss_dur:[91m 0.76129 [0m(+0.05651)


[4m[1m > EPOCH: 418/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00300)
     | > avg_loss:[92m 0.38771 [0m(-0.06189)
     | > avg_log_mle:[92m -0.31478 [0m(-0.00310)
     | > avg_loss_dur:[92m 0.70250 [0m(-0.05879)


[4m[1m > EPOCH: 419/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.45965 [0m(+0.07194)
     | > avg_log_mle:[91m -0.30892 [0m(+0.00587)
     | > avg_loss_dur:[91m 0.76857 [0m(+0.06607)


[4m[1m > EPOCH: 420/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.43544 [0m(-0.02421)
     | > avg_log_mle:[91m -0.29594 [0m(+0.01297)
     | > avg_loss_dur:[92m 0.73139 [0m(-0.03718)


[4m[1m > EPOCH: 421/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.38657 [0m(-0.04888)
     | > avg_log_mle:[92m -0.30211 [0m(-0.00616)
     | > avg_loss_dur:[92m 0.68867 [0m(-0.04271)


[4m[1m > EPOCH: 422/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:30:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.43596 [0m(+0.04940)
     | > avg_log_mle:[92m -0.31168 [0m(-0.00957)
     | > avg_loss_dur:[91m 0.74764 [0m(+0.05896)


[4m[1m > EPOCH: 423/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.38709 [0m(-0.04887)
     | > avg_log_mle:[91m -0.29102 [0m(+0.02066)
     | > avg_loss_dur:[92m 0.67811 [0m(-0.06953)


[4m[1m > EPOCH: 424/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41862 [0m(+0.03152)
     | > avg_log_mle:[92m -0.32295 [0m(-0.03194)
     | > avg_loss_dur:[91m 0.74157 [0m(+0.06346)


[4m[1m > EPOCH: 425/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1275[0m
     | > loss: -0.08521  (-0.08521)
     | > log_mle: -0.35744  (-0.35744)
     | > loss_dur: 0.27223  (0.27223)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 23.16655  (23.16655)
     | > current_lr: 0.00011 
     | > step_time: 0.72570  (0.72567)
     | > loader_time: 0.32230  (0.32228)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.43052 [0m(+0.01190)
     | > avg_log_mle:[92m -0.32478 [0m(-0.00182)
     | > avg_loss_dur:[91m 0.75530 [0m(+0.01372)


[4m[1m > EPOCH: 426/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.40579 [0m(-0.02473)
     | > avg_log_mle:[91m -0.31405 [0m(+0.01073)
     | > avg_loss_dur:[92m 0.71984 [0m(-0.03546)


[4m[1m > EPOCH: 427/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.42492 [0m(+0.01913)
     | > avg_log_mle:[92m -0.31554 [0m(-0.00149)
     | > avg_loss_dur:[91m 0.74046 [0m(+0.02062)


[4m[1m > EPOCH: 428/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.40818 [0m(-0.01673)
     | > avg_log_mle:[92m -0.32475 [0m(-0.00921)
     | > avg_loss_dur:[92m 0.73294 [0m(-0.00752)


[4m[1m > EPOCH: 429/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:31:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.41366 [0m(+0.00548)
     | > avg_log_mle:[91m -0.32129 [0m(+0.00346)
     | > avg_loss_dur:[91m 0.73495 [0m(+0.00202)


[4m[1m > EPOCH: 430/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:32:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.41641 [0m(+0.00275)
     | > avg_log_mle:[92m -0.32281 [0m(-0.00151)
     | > avg_loss_dur:[91m 0.73922 [0m(+0.00426)


[4m[1m > EPOCH: 431/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:32:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.39348 [0m(-0.02293)
     | > avg_log_mle:[91m -0.32229 [0m(+0.00052)
     | > avg_loss_dur:[92m 0.71577 [0m(-0.02345)


[4m[1m > EPOCH: 432/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:32:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.40816 [0m(+0.01468)
     | > avg_log_mle:[92m -0.32670 [0m(-0.00441)
     | > avg_loss_dur:[91m 0.73486 [0m(+0.01909)


[4m[1m > EPOCH: 433/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:32:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1300[0m
     | > loss: -0.03161  (-0.03161)
     | > log_mle: -0.33183  (-0.33183)
     | > loss_dur: 0.30022  (0.30022)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 12.65572  (12.65572)
     | > current_lr: 0.00011 
     | > step_time: 1.03520  (1.03524)
     | > loader_time: 0.41640  (0.41638)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.41701 [0m(+0.00885)
     | > avg_log_mle:[91m -0.32214 [0m(+0.00455)
     | > avg_loss_dur:[91m 0.73915 [0m(+0.00429)


[4m[1m > EPOCH: 434/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:32:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.40125 [0m(-0.01576)
     | > avg_log_mle:[92m -0.33215 [0m(-0.01001)
     | > avg_loss_dur:[92m 0.73340 [0m(-0.00575)


[4m[1m > EPOCH: 435/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:32:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.39926 [0m(-0.00199)
     | > avg_log_mle:[91m -0.32413 [0m(+0.00801)
     | > avg_loss_dur:[92m 0.72339 [0m(-0.01001)


[4m[1m > EPOCH: 436/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.41198 [0m(+0.01273)
     | > avg_log_mle:[92m -0.32854 [0m(-0.00441)
     | > avg_loss_dur:[91m 0.74053 [0m(+0.01714)


[4m[1m > EPOCH: 437/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.40332 [0m(-0.00867)
     | > avg_log_mle:[92m -0.33029 [0m(-0.00174)
     | > avg_loss_dur:[92m 0.73361 [0m(-0.00692)


[4m[1m > EPOCH: 438/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.42506 [0m(+0.02174)
     | > avg_log_mle:[92m -0.33141 [0m(-0.00113)
     | > avg_loss_dur:[91m 0.75647 [0m(+0.02287)


[4m[1m > EPOCH: 439/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37226 [0m(-0.05280)
     | > avg_log_mle:[91m -0.33024 [0m(+0.00118)
     | > avg_loss_dur:[92m 0.70250 [0m(-0.05397)


[4m[1m > EPOCH: 440/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.38959 [0m(+0.01733)
     | > avg_log_mle:[91m -0.32666 [0m(+0.00358)
     | > avg_loss_dur:[91m 0.71625 [0m(+0.01375)


[4m[1m > EPOCH: 441/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1325[0m
     | > loss: -0.09702  (-0.06346)
     | > log_mle: -0.44753  (-0.39057)
     | > loss_dur: 0.35052  (0.32710)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 56.89978  (46.28015)
     | > current_lr: 0.00011 
     | > step_time: 0.40840  (0.72566)
     | > loader_time: 0.11210  (0.26474)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.44504 [0m(+0.05545)
     | > avg_log_mle:[91m -0.30435 [0m(+0.02230)
     | > avg_loss_dur:[91m 0.74939 [0m(+0.03315)


[4m[1m > EPOCH: 442/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:33:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.39310 [0m(-0.05194)
     | > avg_log_mle:[92m -0.32899 [0m(-0.02464)
     | > avg_loss_dur:[92m 0.72209 [0m(-0.02730)


[4m[1m > EPOCH: 443/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:34:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.40710 [0m(+0.01400)
     | > avg_log_mle:[91m -0.32430 [0m(+0.00469)
     | > avg_loss_dur:[91m 0.73140 [0m(+0.00931)


[4m[1m > EPOCH: 444/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:34:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.37052 [0m(-0.03658)
     | > avg_log_mle:[92m -0.32648 [0m(-0.00218)
     | > avg_loss_dur:[92m 0.69700 [0m(-0.03440)


[4m[1m > EPOCH: 445/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:34:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00101)
     | > avg_loss:[91m 0.39976 [0m(+0.02924)
     | > avg_log_mle:[91m -0.32535 [0m(+0.00113)
     | > avg_loss_dur:[91m 0.72511 [0m(+0.02811)


[4m[1m > EPOCH: 446/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:34:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00099)
     | > avg_loss:[92m 0.39885 [0m(-0.00091)
     | > avg_log_mle:[92m -0.33054 [0m(-0.00519)
     | > avg_loss_dur:[91m 0.72939 [0m(+0.00428)


[4m[1m > EPOCH: 447/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:34:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.43001 [0m(+0.03116)
     | > avg_log_mle:[91m -0.32500 [0m(+0.00553)
     | > avg_loss_dur:[91m 0.75501 [0m(+0.02562)


[4m[1m > EPOCH: 448/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:34:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.41038 [0m(-0.01963)
     | > avg_log_mle:[92m -0.32846 [0m(-0.00346)
     | > avg_loss_dur:[92m 0.73884 [0m(-0.01617)


[4m[1m > EPOCH: 449/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.45098 [0m(+0.04060)
     | > avg_log_mle:[91m -0.29779 [0m(+0.03067)
     | > avg_loss_dur:[91m 0.74877 [0m(+0.00993)


[4m[1m > EPOCH: 450/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1350[0m
     | > loss: -0.08623  (-0.08623)
     | > log_mle: -0.36361  (-0.36361)
     | > loss_dur: 0.27738  (0.27738)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 17.84526  (17.84526)
     | > current_lr: 0.00011 
     | > step_time: 0.72870  (0.72866)
     | > loader_time: 0.31730  (0.31728)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.40613 [0m(-0.04484)
     | > avg_log_mle:[91m -0.29488 [0m(+0.00292)
     | > avg_loss_dur:[92m 0.70101 [0m(-0.04776)


[4m[1m > EPOCH: 451/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.41967 [0m(+0.01354)
     | > avg_log_mle:[91m -0.28489 [0m(+0.00999)
     | > avg_loss_dur:[91m 0.70456 [0m(+0.00355)


[4m[1m > EPOCH: 452/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.37372 [0m(-0.04595)
     | > avg_log_mle:[92m -0.30833 [0m(-0.02343)
     | > avg_loss_dur:[92m 0.68205 [0m(-0.02252)


[4m[1m > EPOCH: 453/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.37182 [0m(-0.00191)
     | > avg_log_mle:[92m -0.30926 [0m(-0.00093)
     | > avg_loss_dur:[92m 0.68107 [0m(-0.00097)


[4m[1m > EPOCH: 454/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[91m 0.42452 [0m(+0.05271)
     | > avg_log_mle:[91m -0.29665 [0m(+0.01261)
     | > avg_loss_dur:[91m 0.72118 [0m(+0.04010)


[4m[1m > EPOCH: 455/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:35:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.36254 [0m(-0.06199)
     | > avg_log_mle:[92m -0.32253 [0m(-0.02587)
     | > avg_loss_dur:[92m 0.68506 [0m(-0.03611)


[4m[1m > EPOCH: 456/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:36:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.35706 [0m(-0.00547)
     | > avg_log_mle:[92m -0.33130 [0m(-0.00877)
     | > avg_loss_dur:[91m 0.68836 [0m(+0.00330)


[4m[1m > EPOCH: 457/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:36:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.41539 [0m(+0.05833)
     | > avg_log_mle:[91m -0.29544 [0m(+0.03585)
     | > avg_loss_dur:[91m 0.71083 [0m(+0.02247)


[4m[1m > EPOCH: 458/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:36:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1375[0m
     | > loss: -0.02526  (-0.02526)
     | > log_mle: -0.33353  (-0.33353)
     | > loss_dur: 0.30827  (0.30827)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 20.96629  (20.96629)
     | > current_lr: 0.00011 
     | > step_time: 1.03590  (1.03594)
     | > loader_time: 0.42040  (0.42038)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36801 [0m(-0.04738)
     | > avg_log_mle:[92m -0.33746 [0m(-0.04202)
     | > avg_loss_dur:[92m 0.70547 [0m(-0.00536)


[4m[1m > EPOCH: 459/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:36:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.37823 [0m(+0.01022)
     | > avg_log_mle:[91m -0.32751 [0m(+0.00996)
     | > avg_loss_dur:[91m 0.70574 [0m(+0.00026)


[4m[1m > EPOCH: 460/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:36:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37062 [0m(-0.00761)
     | > avg_log_mle:[92m -0.33344 [0m(-0.00593)
     | > avg_loss_dur:[92m 0.70406 [0m(-0.00167)


[4m[1m > EPOCH: 461/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:36:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.40031 [0m(+0.02968)
     | > avg_log_mle:[91m -0.31482 [0m(+0.01862)
     | > avg_loss_dur:[91m 0.71513 [0m(+0.01106)


[4m[1m > EPOCH: 462/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.37680 [0m(-0.02351)
     | > avg_log_mle:[92m -0.32844 [0m(-0.01362)
     | > avg_loss_dur:[92m 0.70524 [0m(-0.00989)


[4m[1m > EPOCH: 463/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39125 [0m(+0.01445)
     | > avg_log_mle:[92m -0.32954 [0m(-0.00110)
     | > avg_loss_dur:[91m 0.72079 [0m(+0.01555)


[4m[1m > EPOCH: 464/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.40378 [0m(+0.01253)
     | > avg_log_mle:[91m -0.32750 [0m(+0.00204)
     | > avg_loss_dur:[91m 0.73128 [0m(+0.01049)


[4m[1m > EPOCH: 465/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.38242 [0m(-0.02136)
     | > avg_log_mle:[91m -0.26721 [0m(+0.06029)
     | > avg_loss_dur:[92m 0.64963 [0m(-0.08165)


[4m[1m > EPOCH: 466/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1400[0m
     | > loss: -0.11086  (-0.03994)
     | > log_mle: -0.45332  (-0.38025)
     | > loss_dur: 0.34246  (0.34031)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 17.05877  (13.75981)
     | > current_lr: 0.00012 
     | > step_time: 0.40040  (0.71665)
     | > loader_time: 0.10910  (0.26524)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.53306 [0m(+0.15064)
     | > avg_log_mle:[92m -0.26954 [0m(-0.00234)
     | > avg_loss_dur:[91m 0.80260 [0m(+0.15297)


[4m[1m > EPOCH: 467/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.40590 [0m(-0.12716)
     | > avg_log_mle:[92m -0.29214 [0m(-0.02259)
     | > avg_loss_dur:[92m 0.69804 [0m(-0.10456)


[4m[1m > EPOCH: 468/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:37:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.37966 [0m(-0.02624)
     | > avg_log_mle:[92m -0.31487 [0m(-0.02273)
     | > avg_loss_dur:[92m 0.69453 [0m(-0.00351)


[4m[1m > EPOCH: 469/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:38:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[91m 0.42646 [0m(+0.04679)
     | > avg_log_mle:[91m -0.30903 [0m(+0.00583)
     | > avg_loss_dur:[91m 0.73549 [0m(+0.04096)


[4m[1m > EPOCH: 470/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:38:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.42590 [0m(-0.00056)
     | > avg_log_mle:[92m -0.31662 [0m(-0.00759)
     | > avg_loss_dur:[91m 0.74252 [0m(+0.00703)


[4m[1m > EPOCH: 471/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:38:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.39276 [0m(-0.03314)
     | > avg_log_mle:[91m -0.31394 [0m(+0.00268)
     | > avg_loss_dur:[92m 0.70670 [0m(-0.03582)


[4m[1m > EPOCH: 472/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:38:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 0.34364 [0m(-0.04913)
     | > avg_log_mle:[91m -0.30390 [0m(+0.01004)
     | > avg_loss_dur:[92m 0.64754 [0m(-0.05917)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1419.pth

[4m[1m > EPOCH: 473/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:38:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00300)
     | > avg_loss:[92m 0.32917 [0m(-0.01447)
     | > avg_log_mle:[92m -0.33063 [0m(-0.02673)
     | > avg_loss_dur:[91m 0.65980 [0m(+0.01226)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1422.pth

[4m[1m > EPOCH: 474/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:38:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.39046 [0m(+0.06129)
     | > avg_log_mle:[91m -0.32012 [0m(+0.01051)
     | > avg_loss_dur:[91m 0.71058 [0m(+0.05078)


[4m[1m > EPOCH: 475/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1425[0m
     | > loss: -0.10796  (-0.10796)
     | > log_mle: -0.37943  (-0.37943)
     | > loss_dur: 0.27147  (0.27147)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 38.58810  (38.58810)
     | > current_lr: 0.00012 
     | > step_time: 0.72570  (0.72566)
     | > loader_time: 0.31930  (0.31929)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.30637 [0m(-0.08409)
     | > avg_log_mle:[92m -0.33798 [0m(-0.01786)
     | > avg_loss_dur:[92m 0.64434 [0m(-0.06624)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1428.pth

[4m[1m > EPOCH: 476/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.36225 [0m(+0.05589)
     | > avg_log_mle:[91m -0.33125 [0m(+0.00672)
     | > avg_loss_dur:[91m 0.69351 [0m(+0.04916)


[4m[1m > EPOCH: 477/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.36712 [0m(+0.00487)
     | > avg_log_mle:[91m -0.32933 [0m(+0.00192)
     | > avg_loss_dur:[91m 0.69646 [0m(+0.00295)


[4m[1m > EPOCH: 478/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.36631 [0m(-0.00082)
     | > avg_log_mle:[92m -0.33495 [0m(-0.00562)
     | > avg_loss_dur:[91m 0.70126 [0m(+0.00480)


[4m[1m > EPOCH: 479/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.35789 [0m(-0.00841)
     | > avg_log_mle:[92m -0.33674 [0m(-0.00179)
     | > avg_loss_dur:[92m 0.69463 [0m(-0.00663)


[4m[1m > EPOCH: 480/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.37625 [0m(+0.01835)
     | > avg_log_mle:[91m -0.33407 [0m(+0.00267)
     | > avg_loss_dur:[91m 0.71032 [0m(+0.01568)


[4m[1m > EPOCH: 481/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:39:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 0.32979 [0m(-0.04646)
     | > avg_log_mle:[91m -0.32667 [0m(+0.00740)
     | > avg_loss_dur:[92m 0.65645 [0m(-0.05386)


[4m[1m > EPOCH: 482/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:40:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[91m 0.37702 [0m(+0.04724)
     | > avg_log_mle:[91m -0.31515 [0m(+0.01152)
     | > avg_loss_dur:[91m 0.69217 [0m(+0.03572)


[4m[1m > EPOCH: 483/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:40:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1450[0m
     | > loss: 0.02966  (0.02966)
     | > log_mle: -0.27845  (-0.27845)
     | > loss_dur: 0.30811  (0.30811)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 108.37866  (108.37866)
     | > current_lr: 0.00012 
     | > step_time: 1.03290  (1.03294)
     | > loader_time: 0.41440  (0.41438)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.49572 [0m(+0.11869)
     | > avg_log_mle:[91m -0.23025 [0m(+0.08490)
     | > avg_loss_dur:[91m 0.72596 [0m(+0.03379)


[4m[1m > EPOCH: 484/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:40:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.39534 [0m(-0.10037)
     | > avg_log_mle:[92m -0.29077 [0m(-0.06052)
     | > avg_loss_dur:[92m 0.68612 [0m(-0.03985)


[4m[1m > EPOCH: 485/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:40:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.43125 [0m(+0.03590)
     | > avg_log_mle:[91m -0.27566 [0m(+0.01511)
     | > avg_loss_dur:[91m 0.70691 [0m(+0.02080)


[4m[1m > EPOCH: 486/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:40:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.42267 [0m(-0.00858)
     | > avg_log_mle:[92m -0.30701 [0m(-0.03134)
     | > avg_loss_dur:[91m 0.72968 [0m(+0.02276)


[4m[1m > EPOCH: 487/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:40:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38759 [0m(-0.03508)
     | > avg_log_mle:[92m -0.31269 [0m(-0.00569)
     | > avg_loss_dur:[92m 0.70028 [0m(-0.02939)


[4m[1m > EPOCH: 488/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.43259 [0m(+0.04500)
     | > avg_log_mle:[92m -0.32649 [0m(-0.01380)
     | > avg_loss_dur:[91m 0.75908 [0m(+0.05880)


[4m[1m > EPOCH: 489/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.39004 [0m(-0.04255)
     | > avg_log_mle:[92m -0.33241 [0m(-0.00591)
     | > avg_loss_dur:[92m 0.72245 [0m(-0.03663)


[4m[1m > EPOCH: 490/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.40078 [0m(+0.01074)
     | > avg_log_mle:[91m -0.31623 [0m(+0.01618)
     | > avg_loss_dur:[92m 0.71701 [0m(-0.00544)


[4m[1m > EPOCH: 491/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1475[0m
     | > loss: -0.15696  (-0.10207)
     | > log_mle: -0.49521  (-0.42141)
     | > loss_dur: 0.33825  (0.31934)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 29.57052  (26.14679)
     | > current_lr: 0.00012 
     | > step_time: 0.40340  (0.71766)
     | > loader_time: 0.11110  (0.26524)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.36343 [0m(-0.03735)
     | > avg_log_mle:[92m -0.33242 [0m(-0.01619)
     | > avg_loss_dur:[92m 0.69585 [0m(-0.02116)


[4m[1m > EPOCH: 492/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.37008 [0m(+0.00665)
     | > avg_log_mle:[92m -0.33920 [0m(-0.00678)
     | > avg_loss_dur:[91m 0.70928 [0m(+0.01343)


[4m[1m > EPOCH: 493/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.34992 [0m(-0.02016)
     | > avg_log_mle:[91m -0.33209 [0m(+0.00710)
     | > avg_loss_dur:[92m 0.68201 [0m(-0.02726)


[4m[1m > EPOCH: 494/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:41:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[91m 0.37098 [0m(+0.02106)
     | > avg_log_mle:[92m -0.33699 [0m(-0.00490)
     | > avg_loss_dur:[91m 0.70797 [0m(+0.02596)


[4m[1m > EPOCH: 495/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[91m 0.37271 [0m(+0.00173)
     | > avg_log_mle:[92m -0.34135 [0m(-0.00435)
     | > avg_loss_dur:[91m 0.71405 [0m(+0.00608)


[4m[1m > EPOCH: 496/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.35996 [0m(-0.01274)
     | > avg_log_mle:[92m -0.34412 [0m(-0.00277)
     | > avg_loss_dur:[92m 0.70408 [0m(-0.00997)


[4m[1m > EPOCH: 497/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.30731 [0m(-0.05266)
     | > avg_log_mle:[91m -0.33671 [0m(+0.00741)
     | > avg_loss_dur:[92m 0.64402 [0m(-0.06007)


[4m[1m > EPOCH: 498/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.38860 [0m(+0.08129)
     | > avg_log_mle:[91m -0.31476 [0m(+0.02195)
     | > avg_loss_dur:[91m 0.70336 [0m(+0.05935)


[4m[1m > EPOCH: 499/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.38669 [0m(-0.00191)
     | > avg_log_mle:[92m -0.33858 [0m(-0.02381)
     | > avg_loss_dur:[91m 0.72527 [0m(+0.02191)


[4m[1m > EPOCH: 500/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1500[0m
     | > loss: -0.14179  (-0.14179)
     | > log_mle: -0.40810  (-0.40810)
     | > loss_dur: 0.26632  (0.26632)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 10.62669  (10.62669)
     | > current_lr: 0.00013 
     | > step_time: 0.73770  (0.73767)
     | > loader_time: 0.31930  (0.31929)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.38239 [0m(-0.00430)
     | > avg_log_mle:[91m -0.33437 [0m(+0.00420)
     | > avg_loss_dur:[92m 0.71677 [0m(-0.00850)


[4m[1m > EPOCH: 501/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:42:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.42876 [0m(+0.04637)
     | > avg_log_mle:[91m -0.27231 [0m(+0.06206)
     | > avg_loss_dur:[92m 0.70107 [0m(-0.01569)


[4m[1m > EPOCH: 502/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:43:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.46476 [0m(+0.03600)
     | > avg_log_mle:[92m -0.29078 [0m(-0.01847)
     | > avg_loss_dur:[91m 0.75555 [0m(+0.05448)


[4m[1m > EPOCH: 503/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:43:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.32895 [0m(-0.13582)
     | > avg_log_mle:[92m -0.32615 [0m(-0.03537)
     | > avg_loss_dur:[92m 0.65510 [0m(-0.10045)


[4m[1m > EPOCH: 504/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:43:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.42827 [0m(+0.09932)
     | > avg_log_mle:[91m -0.31755 [0m(+0.00860)
     | > avg_loss_dur:[91m 0.74582 [0m(+0.09072)


[4m[1m > EPOCH: 505/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:43:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.38725 [0m(-0.04101)
     | > avg_log_mle:[92m -0.32350 [0m(-0.00595)
     | > avg_loss_dur:[92m 0.71076 [0m(-0.03506)


[4m[1m > EPOCH: 506/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:43:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 0.35369 [0m(-0.03356)
     | > avg_log_mle:[91m -0.31585 [0m(+0.00765)
     | > avg_loss_dur:[92m 0.66954 [0m(-0.04121)


[4m[1m > EPOCH: 507/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:43:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[91m 0.36370 [0m(+0.01001)
     | > avg_log_mle:[92m -0.32794 [0m(-0.01209)
     | > avg_loss_dur:[91m 0.69164 [0m(+0.02210)


[4m[1m > EPOCH: 508/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1525[0m
     | > loss: -0.06389  (-0.06389)
     | > log_mle: -0.35958  (-0.35958)
     | > loss_dur: 0.29568  (0.29568)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 6.93573  (6.93573)
     | > current_lr: 0.00013 
     | > step_time: 1.03900  (1.03895)
     | > loader_time: 0.41640  (0.41637)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.48206 [0m(+0.11836)
     | > avg_log_mle:[91m -0.29235 [0m(+0.03559)
     | > avg_loss_dur:[91m 0.77441 [0m(+0.08277)


[4m[1m > EPOCH: 509/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36069 [0m(-0.12137)
     | > avg_log_mle:[92m -0.32369 [0m(-0.03135)
     | > avg_loss_dur:[92m 0.68438 [0m(-0.09002)


[4m[1m > EPOCH: 510/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.38433 [0m(+0.02364)
     | > avg_log_mle:[92m -0.33424 [0m(-0.01055)
     | > avg_loss_dur:[91m 0.71857 [0m(+0.03419)


[4m[1m > EPOCH: 511/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.34628 [0m(-0.03805)
     | > avg_log_mle:[91m -0.32653 [0m(+0.00771)
     | > avg_loss_dur:[92m 0.67281 [0m(-0.04576)


[4m[1m > EPOCH: 512/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.36165 [0m(+0.01537)
     | > avg_log_mle:[92m -0.33692 [0m(-0.01039)
     | > avg_loss_dur:[91m 0.69857 [0m(+0.02576)


[4m[1m > EPOCH: 513/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.37074 [0m(+0.00909)
     | > avg_log_mle:[92m -0.34014 [0m(-0.00322)
     | > avg_loss_dur:[91m 0.71088 [0m(+0.01231)


[4m[1m > EPOCH: 514/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:44:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.34135 [0m(-0.02939)
     | > avg_log_mle:[92m -0.34057 [0m(-0.00043)
     | > avg_loss_dur:[92m 0.68192 [0m(-0.02896)


[4m[1m > EPOCH: 515/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:45:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.35004 [0m(+0.00869)
     | > avg_log_mle:[92m -0.34810 [0m(-0.00752)
     | > avg_loss_dur:[91m 0.69814 [0m(+0.01621)


[4m[1m > EPOCH: 516/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:45:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1550[0m
     | > loss: -0.19183  (-0.13673)
     | > log_mle: -0.52584  (-0.45199)
     | > loss_dur: 0.33401  (0.31525)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 24.31608  (22.66822)
     | > current_lr: 0.00013 
     | > step_time: 0.39940  (0.71866)
     | > loader_time: 0.10210  (0.26173)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.33935 [0m(-0.01069)
     | > avg_log_mle:[91m -0.33228 [0m(+0.01582)
     | > avg_loss_dur:[92m 0.67163 [0m(-0.02651)


[4m[1m > EPOCH: 517/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:45:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.33627 [0m(-0.00308)
     | > avg_log_mle:[92m -0.33838 [0m(-0.00610)
     | > avg_loss_dur:[91m 0.67465 [0m(+0.00303)


[4m[1m > EPOCH: 518/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:45:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.31149 [0m(-0.02478)
     | > avg_log_mle:[92m -0.34644 [0m(-0.00806)
     | > avg_loss_dur:[92m 0.65793 [0m(-0.01672)


[4m[1m > EPOCH: 519/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:45:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39780 [0m(+0.08631)
     | > avg_log_mle:[91m -0.33081 [0m(+0.01563)
     | > avg_loss_dur:[91m 0.72861 [0m(+0.07068)


[4m[1m > EPOCH: 520/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:45:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38532 [0m(-0.01248)
     | > avg_log_mle:[92m -0.33882 [0m(-0.00801)
     | > avg_loss_dur:[92m 0.72414 [0m(-0.00447)


[4m[1m > EPOCH: 521/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.34199 [0m(-0.04333)
     | > avg_log_mle:[91m -0.33555 [0m(+0.00327)
     | > avg_loss_dur:[92m 0.67754 [0m(-0.04660)


[4m[1m > EPOCH: 522/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 0.34037 [0m(-0.00163)
     | > avg_log_mle:[92m -0.34649 [0m(-0.01094)
     | > avg_loss_dur:[91m 0.68686 [0m(+0.00932)


[4m[1m > EPOCH: 523/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39396 [0m(+0.05359)
     | > avg_log_mle:[91m -0.32788 [0m(+0.01861)
     | > avg_loss_dur:[91m 0.72184 [0m(+0.03498)


[4m[1m > EPOCH: 524/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.35101 [0m(-0.04295)
     | > avg_log_mle:[92m -0.34277 [0m(-0.01489)
     | > avg_loss_dur:[92m 0.69377 [0m(-0.02807)


[4m[1m > EPOCH: 525/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1575[0m
     | > loss: -0.16129  (-0.16129)
     | > log_mle: -0.42714  (-0.42714)
     | > loss_dur: 0.26585  (0.26585)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 35.13165  (35.13165)
     | > current_lr: 0.00013 
     | > step_time: 0.72870  (0.72867)
     | > loader_time: 0.31630  (0.31629)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39320 [0m(+0.04219)
     | > avg_log_mle:[91m -0.33744 [0m(+0.00532)
     | > avg_loss_dur:[91m 0.73064 [0m(+0.03687)


[4m[1m > EPOCH: 526/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41084 [0m(+0.01765)
     | > avg_log_mle:[91m -0.33121 [0m(+0.00623)
     | > avg_loss_dur:[91m 0.74206 [0m(+0.01142)


[4m[1m > EPOCH: 527/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:46:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00100)
     | > avg_loss:[92m 0.31371 [0m(-0.09714)
     | > avg_log_mle:[92m -0.35051 [0m(-0.01930)
     | > avg_loss_dur:[92m 0.66422 [0m(-0.07783)


[4m[1m > EPOCH: 528/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[91m 0.42277 [0m(+0.10906)
     | > avg_log_mle:[91m -0.30362 [0m(+0.04689)
     | > avg_loss_dur:[91m 0.72639 [0m(+0.06217)


[4m[1m > EPOCH: 529/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.34272 [0m(-0.08006)
     | > avg_log_mle:[92m -0.34366 [0m(-0.04004)
     | > avg_loss_dur:[92m 0.68637 [0m(-0.04002)


[4m[1m > EPOCH: 530/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.32185 [0m(-0.02086)
     | > avg_log_mle:[92m -0.34504 [0m(-0.00138)
     | > avg_loss_dur:[92m 0.66689 [0m(-0.01948)


[4m[1m > EPOCH: 531/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.37023 [0m(+0.04837)
     | > avg_log_mle:[91m -0.30723 [0m(+0.03781)
     | > avg_loss_dur:[91m 0.67746 [0m(+0.01056)


[4m[1m > EPOCH: 532/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.41387 [0m(+0.04365)
     | > avg_log_mle:[92m -0.32056 [0m(-0.01333)
     | > avg_loss_dur:[91m 0.73443 [0m(+0.05698)


[4m[1m > EPOCH: 533/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1600[0m
     | > loss: -0.08500  (-0.08500)
     | > log_mle: -0.38154  (-0.38154)
     | > loss_dur: 0.29654  (0.29654)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 15.33016  (15.33016)
     | > current_lr: 0.00013 
     | > step_time: 1.03390  (1.03394)
     | > loader_time: 0.43540  (0.43540)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.36614 [0m(-0.04773)
     | > avg_log_mle:[92m -0.35017 [0m(-0.02961)
     | > avg_loss_dur:[92m 0.71631 [0m(-0.01812)


[4m[1m > EPOCH: 534/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:47:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.39431 [0m(+0.02816)
     | > avg_log_mle:[91m -0.29018 [0m(+0.05999)
     | > avg_loss_dur:[92m 0.68448 [0m(-0.03182)


[4m[1m > EPOCH: 535/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:48:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.47291 [0m(+0.07860)
     | > avg_log_mle:[91m -0.27672 [0m(+0.01346)
     | > avg_loss_dur:[91m 0.74962 [0m(+0.06514)


[4m[1m > EPOCH: 536/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:48:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36631 [0m(-0.10659)
     | > avg_log_mle:[92m -0.29798 [0m(-0.02126)
     | > avg_loss_dur:[92m 0.66429 [0m(-0.08533)


[4m[1m > EPOCH: 537/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:48:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.33253 [0m(-0.03378)
     | > avg_log_mle:[92m -0.33882 [0m(-0.04084)
     | > avg_loss_dur:[91m 0.67135 [0m(+0.00706)


[4m[1m > EPOCH: 538/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:48:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.35232 [0m(+0.01979)
     | > avg_log_mle:[91m -0.31899 [0m(+0.01983)
     | > avg_loss_dur:[92m 0.67130 [0m(-0.00005)


[4m[1m > EPOCH: 539/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:48:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39745 [0m(+0.04514)
     | > avg_log_mle:[91m -0.31495 [0m(+0.00404)
     | > avg_loss_dur:[91m 0.71240 [0m(+0.04110)


[4m[1m > EPOCH: 540/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:48:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.34945 [0m(-0.04800)
     | > avg_log_mle:[92m -0.32658 [0m(-0.01163)
     | > avg_loss_dur:[92m 0.67603 [0m(-0.03638)


[4m[1m > EPOCH: 541/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1625[0m
     | > loss: -0.19269  (-0.14077)
     | > log_mle: -0.52947  (-0.45626)
     | > loss_dur: 0.33678  (0.31549)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 79.28270  (44.36696)
     | > current_lr: 0.00014 
     | > step_time: 0.40140  (0.72035)
     | > loader_time: 0.10410  (0.26074)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.40054 [0m(+0.05109)
     | > avg_log_mle:[91m -0.28942 [0m(+0.03716)
     | > avg_loss_dur:[91m 0.68996 [0m(+0.01393)


[4m[1m > EPOCH: 542/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.40731 [0m(+0.00677)
     | > avg_log_mle:[92m -0.32397 [0m(-0.03455)
     | > avg_loss_dur:[91m 0.73128 [0m(+0.04132)


[4m[1m > EPOCH: 543/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.39429 [0m(-0.01302)
     | > avg_log_mle:[92m -0.32534 [0m(-0.00137)
     | > avg_loss_dur:[92m 0.71963 [0m(-0.01164)


[4m[1m > EPOCH: 544/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.29920 [0m(-0.09509)
     | > avg_log_mle:[92m -0.32973 [0m(-0.00438)
     | > avg_loss_dur:[92m 0.62893 [0m(-0.09071)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1635.pth

[4m[1m > EPOCH: 545/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.37445 [0m(+0.07525)
     | > avg_log_mle:[92m -0.33279 [0m(-0.00306)
     | > avg_loss_dur:[91m 0.70724 [0m(+0.07831)


[4m[1m > EPOCH: 546/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35263 [0m(-0.02182)
     | > avg_log_mle:[92m -0.33432 [0m(-0.00153)
     | > avg_loss_dur:[92m 0.68695 [0m(-0.02029)


[4m[1m > EPOCH: 547/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:49:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.36793 [0m(+0.01530)
     | > avg_log_mle:[92m -0.33680 [0m(-0.00248)
     | > avg_loss_dur:[91m 0.70473 [0m(+0.01778)


[4m[1m > EPOCH: 548/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:50:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35456 [0m(-0.01338)
     | > avg_log_mle:[92m -0.34287 [0m(-0.00606)
     | > avg_loss_dur:[92m 0.69742 [0m(-0.00731)


[4m[1m > EPOCH: 549/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:50:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.31537 [0m(-0.03919)
     | > avg_log_mle:[91m -0.33124 [0m(+0.01162)
     | > avg_loss_dur:[92m 0.64661 [0m(-0.05081)


[4m[1m > EPOCH: 550/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:50:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1650[0m
     | > loss: -0.16815  (-0.16815)
     | > log_mle: -0.42913  (-0.42913)
     | > loss_dur: 0.26098  (0.26098)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 28.58533  (28.58533)
     | > current_lr: 0.00014 
     | > step_time: 0.74270  (0.74268)
     | > loader_time: 0.32330  (0.32329)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.38057 [0m(+0.06520)
     | > avg_log_mle:[91m -0.31899 [0m(+0.01226)
     | > avg_loss_dur:[91m 0.69956 [0m(+0.05294)


[4m[1m > EPOCH: 551/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:50:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39925 [0m(+0.01868)
     | > avg_log_mle:[92m -0.32579 [0m(-0.00681)
     | > avg_loss_dur:[91m 0.72504 [0m(+0.02548)


[4m[1m > EPOCH: 552/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:50:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38705 [0m(-0.01220)
     | > avg_log_mle:[92m -0.32581 [0m(-0.00001)
     | > avg_loss_dur:[92m 0.71286 [0m(-0.01219)


[4m[1m > EPOCH: 553/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:50:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.32930 [0m(-0.05775)
     | > avg_log_mle:[92m -0.32944 [0m(-0.00363)
     | > avg_loss_dur:[92m 0.65874 [0m(-0.05412)


[4m[1m > EPOCH: 554/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.40281 [0m(+0.07351)
     | > avg_log_mle:[91m -0.32251 [0m(+0.00692)
     | > avg_loss_dur:[91m 0.72533 [0m(+0.06659)


[4m[1m > EPOCH: 555/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37857 [0m(-0.02424)
     | > avg_log_mle:[92m -0.32804 [0m(-0.00552)
     | > avg_loss_dur:[92m 0.70661 [0m(-0.01872)


[4m[1m > EPOCH: 556/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36007 [0m(-0.01850)
     | > avg_log_mle:[92m -0.33955 [0m(-0.01151)
     | > avg_loss_dur:[92m 0.69962 [0m(-0.00699)


[4m[1m > EPOCH: 557/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.35058 [0m(-0.00949)
     | > avg_log_mle:[91m -0.32166 [0m(+0.01789)
     | > avg_loss_dur:[92m 0.67224 [0m(-0.02738)


[4m[1m > EPOCH: 558/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1675[0m
     | > loss: -0.09182  (-0.09182)
     | > log_mle: -0.38908  (-0.38908)
     | > loss_dur: 0.29727  (0.29727)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 36.06175  (36.06175)
     | > current_lr: 0.00014 
     | > step_time: 1.04600  (1.04595)
     | > loader_time: 0.41740  (0.41738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.36207 [0m(+0.01149)
     | > avg_log_mle:[92m -0.33735 [0m(-0.01569)
     | > avg_loss_dur:[91m 0.69942 [0m(+0.02718)


[4m[1m > EPOCH: 559/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.38185 [0m(+0.01977)
     | > avg_log_mle:[91m -0.33380 [0m(+0.00355)
     | > avg_loss_dur:[91m 0.71565 [0m(+0.01623)


[4m[1m > EPOCH: 560/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:51:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.32983 [0m(-0.05202)
     | > avg_log_mle:[91m -0.32445 [0m(+0.00935)
     | > avg_loss_dur:[92m 0.65428 [0m(-0.06137)


[4m[1m > EPOCH: 561/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.35017 [0m(+0.02035)
     | > avg_log_mle:[91m -0.31246 [0m(+0.01200)
     | > avg_loss_dur:[91m 0.66263 [0m(+0.00835)


[4m[1m > EPOCH: 562/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39767 [0m(+0.04749)
     | > avg_log_mle:[92m -0.32514 [0m(-0.01268)
     | > avg_loss_dur:[91m 0.72281 [0m(+0.06018)


[4m[1m > EPOCH: 563/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.33004 [0m(-0.06763)
     | > avg_log_mle:[92m -0.35073 [0m(-0.02559)
     | > avg_loss_dur:[92m 0.68077 [0m(-0.04204)


[4m[1m > EPOCH: 564/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.36120 [0m(+0.03115)
     | > avg_log_mle:[91m -0.34133 [0m(+0.00940)
     | > avg_loss_dur:[91m 0.70252 [0m(+0.02175)


[4m[1m > EPOCH: 565/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.34688 [0m(-0.01431)
     | > avg_log_mle:[92m -0.34245 [0m(-0.00112)
     | > avg_loss_dur:[92m 0.68933 [0m(-0.01319)


[4m[1m > EPOCH: 566/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1700[0m
     | > loss: -0.24332  (-0.17545)
     | > log_mle: -0.56809  (-0.48552)
     | > loss_dur: 0.32477  (0.31006)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 25.21235  (29.37578)
     | > current_lr: 0.00014 
     | > step_time: 0.39640  (0.71365)
     | > loader_time: 0.10010  (0.25924)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.35346 [0m(+0.00658)
     | > avg_log_mle:[91m -0.31893 [0m(+0.02351)
     | > avg_loss_dur:[92m 0.67239 [0m(-0.01694)


[4m[1m > EPOCH: 567/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:52:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.32233 [0m(-0.03113)
     | > avg_log_mle:[92m -0.34677 [0m(-0.02784)
     | > avg_loss_dur:[92m 0.66910 [0m(-0.00329)


[4m[1m > EPOCH: 568/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:53:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.34132 [0m(+0.01899)
     | > avg_log_mle:[91m -0.33904 [0m(+0.00773)
     | > avg_loss_dur:[91m 0.68036 [0m(+0.01126)


[4m[1m > EPOCH: 569/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:53:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.35974 [0m(+0.01842)
     | > avg_log_mle:[92m -0.34489 [0m(-0.00586)
     | > avg_loss_dur:[91m 0.70464 [0m(+0.02428)


[4m[1m > EPOCH: 570/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:53:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39488 [0m(+0.03514)
     | > avg_log_mle:[91m -0.23139 [0m(+0.11350)
     | > avg_loss_dur:[92m 0.62627 [0m(-0.07836)


[4m[1m > EPOCH: 571/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:53:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.40676 [0m(+0.01188)
     | > avg_log_mle:[92m -0.33744 [0m(-0.10605)
     | > avg_loss_dur:[91m 0.74421 [0m(+0.11793)


[4m[1m > EPOCH: 572/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:53:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.37587 [0m(-0.03089)
     | > avg_log_mle:[91m -0.28526 [0m(+0.05218)
     | > avg_loss_dur:[92m 0.66113 [0m(-0.08307)


[4m[1m > EPOCH: 573/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:53:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.40401 [0m(+0.02814)
     | > avg_log_mle:[92m -0.29477 [0m(-0.00951)
     | > avg_loss_dur:[91m 0.69878 [0m(+0.03765)


[4m[1m > EPOCH: 574/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.41661 [0m(+0.01260)
     | > avg_log_mle:[92m -0.32767 [0m(-0.03289)
     | > avg_loss_dur:[91m 0.74427 [0m(+0.04549)


[4m[1m > EPOCH: 575/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1725[0m
     | > loss: -0.16625  (-0.16625)
     | > log_mle: -0.43135  (-0.43135)
     | > loss_dur: 0.26510  (0.26510)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 25.72653  (25.72653)
     | > current_lr: 0.00014 
     | > step_time: 0.73170  (0.73168)
     | > loader_time: 0.31830  (0.31828)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.37099 [0m(-0.04561)
     | > avg_log_mle:[91m -0.30907 [0m(+0.01860)
     | > avg_loss_dur:[92m 0.68006 [0m(-0.06421)


[4m[1m > EPOCH: 576/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.44780 [0m(+0.07680)
     | > avg_log_mle:[91m -0.25533 [0m(+0.05374)
     | > avg_loss_dur:[91m 0.70313 [0m(+0.02306)


[4m[1m > EPOCH: 577/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 0.39560 [0m(-0.05220)
     | > avg_log_mle:[92m -0.32065 [0m(-0.06532)
     | > avg_loss_dur:[91m 0.71625 [0m(+0.01312)


[4m[1m > EPOCH: 578/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.44088 [0m(+0.04528)
     | > avg_log_mle:[91m -0.29973 [0m(+0.02092)
     | > avg_loss_dur:[91m 0.74061 [0m(+0.02436)


[4m[1m > EPOCH: 579/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41654 [0m(-0.02434)
     | > avg_log_mle:[92m -0.31783 [0m(-0.01810)
     | > avg_loss_dur:[92m 0.73437 [0m(-0.00624)


[4m[1m > EPOCH: 580/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:54:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.43480 [0m(+0.01825)
     | > avg_log_mle:[91m -0.29170 [0m(+0.02613)
     | > avg_loss_dur:[92m 0.72650 [0m(-0.00788)


[4m[1m > EPOCH: 581/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.47583 [0m(+0.04104)
     | > avg_log_mle:[91m -0.24895 [0m(+0.04275)
     | > avg_loss_dur:[92m 0.72478 [0m(-0.00171)


[4m[1m > EPOCH: 582/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.34455 [0m(-0.13129)
     | > avg_log_mle:[92m -0.33243 [0m(-0.08348)
     | > avg_loss_dur:[92m 0.67698 [0m(-0.04781)


[4m[1m > EPOCH: 583/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1750[0m
     | > loss: -0.06455  (-0.06455)
     | > log_mle: -0.36673  (-0.36673)
     | > loss_dur: 0.30218  (0.30218)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 15.33888  (15.33888)
     | > current_lr: 0.00015 
     | > step_time: 1.03200  (1.03195)
     | > loader_time: 0.43940  (0.43939)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.33953 [0m(-0.00501)
     | > avg_log_mle:[91m -0.30703 [0m(+0.02540)
     | > avg_loss_dur:[92m 0.64656 [0m(-0.03042)


[4m[1m > EPOCH: 584/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.35035 [0m(+0.01082)
     | > avg_log_mle:[92m -0.32636 [0m(-0.01933)
     | > avg_loss_dur:[91m 0.67671 [0m(+0.03015)


[4m[1m > EPOCH: 585/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.33672 [0m(-0.01363)
     | > avg_log_mle:[92m -0.32763 [0m(-0.00127)
     | > avg_loss_dur:[92m 0.66435 [0m(-0.01236)


[4m[1m > EPOCH: 586/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.34676 [0m(+0.01004)
     | > avg_log_mle:[91m -0.32523 [0m(+0.00240)
     | > avg_loss_dur:[91m 0.67199 [0m(+0.00763)


[4m[1m > EPOCH: 587/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:55:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.32597 [0m(-0.02078)
     | > avg_log_mle:[92m -0.35170 [0m(-0.02647)
     | > avg_loss_dur:[91m 0.67767 [0m(+0.00569)


[4m[1m > EPOCH: 588/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:56:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.27301 [0m(-0.05296)
     | > avg_log_mle:[91m -0.32597 [0m(+0.02573)
     | > avg_loss_dur:[92m 0.59898 [0m(-0.07869)

 > BEST MODEL : D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436\best_model_1767.pth

[4m[1m > EPOCH: 589/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:56:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.33167 [0m(+0.05865)
     | > avg_log_mle:[92m -0.33443 [0m(-0.00846)
     | > avg_loss_dur:[91m 0.66610 [0m(+0.06712)


[4m[1m > EPOCH: 590/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:56:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.43116 [0m(+0.09950)
     | > avg_log_mle:[91m -0.30458 [0m(+0.02985)
     | > avg_loss_dur:[91m 0.73574 [0m(+0.06965)


[4m[1m > EPOCH: 591/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:56:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1775[0m
     | > loss: -0.24418  (-0.14696)
     | > log_mle: -0.56549  (-0.46213)
     | > loss_dur: 0.32131  (0.31517)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 24.18537  (20.14215)
     | > current_lr: 0.00015 
     | > step_time: 0.40240  (0.72816)
     | > loader_time: 0.10410  (0.26124)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.40419 [0m(-0.02698)
     | > avg_log_mle:[91m -0.29676 [0m(+0.00782)
     | > avg_loss_dur:[92m 0.70095 [0m(-0.03479)


[4m[1m > EPOCH: 592/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:56:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.38810 [0m(-0.01609)
     | > avg_log_mle:[92m -0.31724 [0m(-0.02048)
     | > avg_loss_dur:[91m 0.70533 [0m(+0.00439)


[4m[1m > EPOCH: 593/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:56:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.54504 [0m(+0.15694)
     | > avg_log_mle:[91m -0.20634 [0m(+0.11090)
     | > avg_loss_dur:[91m 0.75137 [0m(+0.04604)


[4m[1m > EPOCH: 594/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38855 [0m(-0.15649)
     | > avg_log_mle:[92m -0.33435 [0m(-0.12802)
     | > avg_loss_dur:[92m 0.72290 [0m(-0.02847)


[4m[1m > EPOCH: 595/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.40682 [0m(+0.01827)
     | > avg_log_mle:[91m -0.31744 [0m(+0.01691)
     | > avg_loss_dur:[91m 0.72426 [0m(+0.00135)


[4m[1m > EPOCH: 596/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 0.39312 [0m(-0.01370)
     | > avg_log_mle:[91m -0.30580 [0m(+0.01164)
     | > avg_loss_dur:[92m 0.69892 [0m(-0.02534)


[4m[1m > EPOCH: 597/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.46027 [0m(+0.06715)
     | > avg_log_mle:[91m -0.30378 [0m(+0.00202)
     | > avg_loss_dur:[91m 0.76405 [0m(+0.06513)


[4m[1m > EPOCH: 598/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.42172 [0m(-0.03855)
     | > avg_log_mle:[92m -0.32764 [0m(-0.02386)
     | > avg_loss_dur:[92m 0.74936 [0m(-0.01469)


[4m[1m > EPOCH: 599/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.44332 [0m(+0.02160)
     | > avg_log_mle:[91m -0.30444 [0m(+0.02320)
     | > avg_loss_dur:[92m 0.74776 [0m(-0.00160)


[4m[1m > EPOCH: 600/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:57:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1800[0m
     | > loss: -0.18009  (-0.18009)
     | > log_mle: -0.44072  (-0.44072)
     | > loss_dur: 0.26063  (0.26063)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 28.06902  (28.06902)
     | > current_lr: 0.00015 
     | > step_time: 0.72770  (0.72766)
     | > loader_time: 0.32930  (0.32929)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.35809 [0m(-0.08523)
     | > avg_log_mle:[92m -0.32814 [0m(-0.02369)
     | > avg_loss_dur:[92m 0.68623 [0m(-0.06153)


[4m[1m > EPOCH: 601/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:58:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.37108 [0m(+0.01299)
     | > avg_log_mle:[91m -0.31096 [0m(+0.01718)
     | > avg_loss_dur:[92m 0.68204 [0m(-0.00419)


[4m[1m > EPOCH: 602/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:58:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36325 [0m(-0.00783)
     | > avg_log_mle:[92m -0.32887 [0m(-0.01791)
     | > avg_loss_dur:[91m 0.69212 [0m(+0.01008)


[4m[1m > EPOCH: 603/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:58:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.41267 [0m(+0.04942)
     | > avg_log_mle:[91m -0.32050 [0m(+0.00837)
     | > avg_loss_dur:[91m 0.73317 [0m(+0.04105)


[4m[1m > EPOCH: 604/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:58:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37484 [0m(-0.03784)
     | > avg_log_mle:[92m -0.34149 [0m(-0.02099)
     | > avg_loss_dur:[92m 0.71633 [0m(-0.01684)


[4m[1m > EPOCH: 605/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:58:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.44423 [0m(+0.06939)
     | > avg_log_mle:[91m -0.31809 [0m(+0.02341)
     | > avg_loss_dur:[91m 0.76231 [0m(+0.04599)


[4m[1m > EPOCH: 606/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:58:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.34332 [0m(-0.10091)
     | > avg_log_mle:[92m -0.32246 [0m(-0.00438)
     | > avg_loss_dur:[92m 0.66578 [0m(-0.09653)


[4m[1m > EPOCH: 607/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.35320 [0m(+0.00988)
     | > avg_log_mle:[92m -0.34106 [0m(-0.01860)
     | > avg_loss_dur:[91m 0.69426 [0m(+0.02848)


[4m[1m > EPOCH: 608/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1825[0m
     | > loss: -0.11430  (-0.11430)
     | > log_mle: -0.40588  (-0.40588)
     | > loss_dur: 0.29158  (0.29158)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 39.09854  (39.09854)
     | > current_lr: 0.00015 
     | > step_time: 1.03700  (1.03695)
     | > loader_time: 0.42740  (0.42739)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.33553 [0m(-0.01767)
     | > avg_log_mle:[91m -0.32156 [0m(+0.01950)
     | > avg_loss_dur:[92m 0.65710 [0m(-0.03717)


[4m[1m > EPOCH: 609/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.36366 [0m(+0.02813)
     | > avg_log_mle:[92m -0.32442 [0m(-0.00286)
     | > avg_loss_dur:[91m 0.68809 [0m(+0.03099)


[4m[1m > EPOCH: 610/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39521 [0m(+0.03155)
     | > avg_log_mle:[92m -0.33133 [0m(-0.00691)
     | > avg_loss_dur:[91m 0.72655 [0m(+0.03846)


[4m[1m > EPOCH: 611/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.30130 [0m(-0.09391)
     | > avg_log_mle:[92m -0.34257 [0m(-0.01124)
     | > avg_loss_dur:[92m 0.64388 [0m(-0.08267)


[4m[1m > EPOCH: 612/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.34662 [0m(+0.04531)
     | > avg_log_mle:[91m -0.32210 [0m(+0.02047)
     | > avg_loss_dur:[91m 0.66871 [0m(+0.02484)


[4m[1m > EPOCH: 613/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 05:59:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.30398 [0m(-0.04264)
     | > avg_log_mle:[92m -0.33358 [0m(-0.01148)
     | > avg_loss_dur:[92m 0.63755 [0m(-0.03116)


[4m[1m > EPOCH: 614/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.30554 [0m(+0.00157)
     | > avg_log_mle:[92m -0.34139 [0m(-0.00781)
     | > avg_loss_dur:[91m 0.64693 [0m(+0.00938)


[4m[1m > EPOCH: 615/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.33551 [0m(+0.02996)
     | > avg_log_mle:[92m -0.34213 [0m(-0.00074)
     | > avg_loss_dur:[91m 0.67764 [0m(+0.03071)


[4m[1m > EPOCH: 616/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1850[0m
     | > loss: -0.30525  (-0.22181)
     | > log_mle: -0.61234  (-0.51997)
     | > loss_dur: 0.30708  (0.29816)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 78.14159  (71.18340)
     | > current_lr: 0.00015 
     | > step_time: 0.40540  (0.71815)
     | > loader_time: 0.10610  (0.26324)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.41508 [0m(+0.07957)
     | > avg_log_mle:[91m -0.30806 [0m(+0.03407)
     | > avg_loss_dur:[91m 0.72314 [0m(+0.04550)


[4m[1m > EPOCH: 617/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.38502 [0m(-0.03006)
     | > avg_log_mle:[92m -0.33752 [0m(-0.02946)
     | > avg_loss_dur:[92m 0.72254 [0m(-0.00060)


[4m[1m > EPOCH: 618/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00100)
     | > avg_loss:[92m 0.35982 [0m(-0.02520)
     | > avg_log_mle:[91m -0.32457 [0m(+0.01295)
     | > avg_loss_dur:[92m 0.68439 [0m(-0.03815)


[4m[1m > EPOCH: 619/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39335 [0m(+0.03353)
     | > avg_log_mle:[91m -0.31631 [0m(+0.00827)
     | > avg_loss_dur:[91m 0.70965 [0m(+0.02526)


[4m[1m > EPOCH: 620/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:00:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.36576 [0m(-0.02759)
     | > avg_log_mle:[91m -0.31437 [0m(+0.00193)
     | > avg_loss_dur:[92m 0.68014 [0m(-0.02952)


[4m[1m > EPOCH: 621/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:01:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 0.35281 [0m(-0.01295)
     | > avg_log_mle:[92m -0.34122 [0m(-0.02685)
     | > avg_loss_dur:[91m 0.69403 [0m(+0.01389)


[4m[1m > EPOCH: 622/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:01:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39329 [0m(+0.04048)
     | > avg_log_mle:[91m -0.30516 [0m(+0.03606)
     | > avg_loss_dur:[91m 0.69845 [0m(+0.00442)


[4m[1m > EPOCH: 623/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:01:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.37169 [0m(-0.02160)
     | > avg_log_mle:[92m -0.33395 [0m(-0.02879)
     | > avg_loss_dur:[91m 0.70564 [0m(+0.00719)


[4m[1m > EPOCH: 624/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:01:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.46918 [0m(+0.09749)
     | > avg_log_mle:[91m -0.23096 [0m(+0.10299)
     | > avg_loss_dur:[92m 0.70014 [0m(-0.00550)


[4m[1m > EPOCH: 625/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:01:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1875[0m
     | > loss: -0.15647  (-0.15647)
     | > log_mle: -0.42168  (-0.42168)
     | > loss_dur: 0.26521  (0.26521)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 32.04551  (32.04551)
     | > current_lr: 0.00016 
     | > step_time: 0.73570  (0.73567)
     | > loader_time: 0.33130  (0.33130)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.39099 [0m(-0.07819)
     | > avg_log_mle:[92m -0.33349 [0m(-0.10252)
     | > avg_loss_dur:[91m 0.72448 [0m(+0.02434)


[4m[1m > EPOCH: 626/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:01:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.35534 [0m(-0.03565)
     | > avg_log_mle:[92m -0.33524 [0m(-0.00175)
     | > avg_loss_dur:[92m 0.69058 [0m(-0.03390)


[4m[1m > EPOCH: 627/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.33845 [0m(-0.01689)
     | > avg_log_mle:[91m -0.31549 [0m(+0.01975)
     | > avg_loss_dur:[92m 0.65394 [0m(-0.03664)


[4m[1m > EPOCH: 628/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.40672 [0m(+0.06827)
     | > avg_log_mle:[91m -0.30668 [0m(+0.00881)
     | > avg_loss_dur:[91m 0.71340 [0m(+0.05946)


[4m[1m > EPOCH: 629/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.36866 [0m(-0.03806)
     | > avg_log_mle:[92m -0.34044 [0m(-0.03377)
     | > avg_loss_dur:[92m 0.70911 [0m(-0.00429)


[4m[1m > EPOCH: 630/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 0.33297 [0m(-0.03569)
     | > avg_log_mle:[92m -0.34061 [0m(-0.00016)
     | > avg_loss_dur:[92m 0.67358 [0m(-0.03553)


[4m[1m > EPOCH: 631/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.35859 [0m(+0.02562)
     | > avg_log_mle:[91m -0.32182 [0m(+0.01879)
     | > avg_loss_dur:[91m 0.68041 [0m(+0.00683)


[4m[1m > EPOCH: 632/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.28502 [0m(-0.07357)
     | > avg_log_mle:[91m -0.31748 [0m(+0.00434)
     | > avg_loss_dur:[92m 0.60250 [0m(-0.07791)


[4m[1m > EPOCH: 633/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:02:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1900[0m
     | > loss: -0.11539  (-0.11539)
     | > log_mle: -0.40864  (-0.40864)
     | > loss_dur: 0.29325  (0.29325)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 41.28393  (41.28393)
     | > current_lr: 0.00016 
     | > step_time: 1.03500  (1.03505)
     | > loader_time: 0.41940  (0.41938)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.31858 [0m(+0.03357)
     | > avg_log_mle:[92m -0.32167 [0m(-0.00419)
     | > avg_loss_dur:[91m 0.64025 [0m(+0.03775)


[4m[1m > EPOCH: 634/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:03:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.36425 [0m(+0.04567)
     | > avg_log_mle:[92m -0.32521 [0m(-0.00354)
     | > avg_loss_dur:[91m 0.68946 [0m(+0.04921)


[4m[1m > EPOCH: 635/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:03:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.38460 [0m(+0.02035)
     | > avg_log_mle:[91m -0.31308 [0m(+0.01212)
     | > avg_loss_dur:[91m 0.69769 [0m(+0.00823)


[4m[1m > EPOCH: 636/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:03:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.42638 [0m(+0.04177)
     | > avg_log_mle:[91m -0.29462 [0m(+0.01846)
     | > avg_loss_dur:[91m 0.72100 [0m(+0.02331)


[4m[1m > EPOCH: 637/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:03:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.31743 [0m(-0.10895)
     | > avg_log_mle:[92m -0.31966 [0m(-0.02504)
     | > avg_loss_dur:[92m 0.63709 [0m(-0.08391)


[4m[1m > EPOCH: 638/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:03:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.37299 [0m(+0.05557)
     | > avg_log_mle:[92m -0.33440 [0m(-0.01474)
     | > avg_loss_dur:[91m 0.70740 [0m(+0.07031)


[4m[1m > EPOCH: 639/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:03:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.37503 [0m(+0.00204)
     | > avg_log_mle:[91m -0.32803 [0m(+0.00637)
     | > avg_loss_dur:[92m 0.70306 [0m(-0.00434)


[4m[1m > EPOCH: 640/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37268 [0m(-0.00235)
     | > avg_log_mle:[92m -0.33099 [0m(-0.00296)
     | > avg_loss_dur:[91m 0.70367 [0m(+0.00060)


[4m[1m > EPOCH: 641/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 1925[0m
     | > loss: -0.35216  (-0.25035)
     | > log_mle: -0.64892  (-0.54273)
     | > loss_dur: 0.29676  (0.29237)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 30.55378  (23.08076)
     | > current_lr: 0.00016 
     | > step_time: 0.40240  (0.72316)
     | > loader_time: 0.10610  (0.26074)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.30187 [0m(-0.07081)
     | > avg_log_mle:[92m -0.33948 [0m(-0.00849)
     | > avg_loss_dur:[92m 0.64135 [0m(-0.06232)


[4m[1m > EPOCH: 642/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.44348 [0m(+0.14162)
     | > avg_log_mle:[91m -0.31799 [0m(+0.02149)
     | > avg_loss_dur:[91m 0.76148 [0m(+0.12013)


[4m[1m > EPOCH: 643/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37039 [0m(-0.07309)
     | > avg_log_mle:[92m -0.33284 [0m(-0.01485)
     | > avg_loss_dur:[92m 0.70323 [0m(-0.05825)


[4m[1m > EPOCH: 644/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36552 [0m(-0.00487)
     | > avg_log_mle:[92m -0.33646 [0m(-0.00362)
     | > avg_loss_dur:[92m 0.70198 [0m(-0.00125)


[4m[1m > EPOCH: 645/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.37441 [0m(+0.00889)
     | > avg_log_mle:[91m -0.30394 [0m(+0.03252)
     | > avg_loss_dur:[92m 0.67835 [0m(-0.02363)


[4m[1m > EPOCH: 646/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:04:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.38133 [0m(+0.00692)
     | > avg_log_mle:[92m -0.32289 [0m(-0.01895)
     | > avg_loss_dur:[91m 0.70423 [0m(+0.02588)


[4m[1m > EPOCH: 647/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.33149 [0m(-0.04984)
     | > avg_log_mle:[92m -0.32757 [0m(-0.00467)
     | > avg_loss_dur:[92m 0.65906 [0m(-0.04517)


[4m[1m > EPOCH: 648/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.40637 [0m(+0.07488)
     | > avg_log_mle:[91m -0.32444 [0m(+0.00313)
     | > avg_loss_dur:[91m 0.73081 [0m(+0.07175)


[4m[1m > EPOCH: 649/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.37353 [0m(-0.03284)
     | > avg_log_mle:[91m -0.32042 [0m(+0.00401)
     | > avg_loss_dur:[92m 0.69395 [0m(-0.03686)


[4m[1m > EPOCH: 650/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 1950[0m
     | > loss: -0.25431  (-0.25431)
     | > log_mle: -0.50523  (-0.50523)
     | > loss_dur: 0.25092  (0.25092)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 38.08582  (38.08582)
     | > current_lr: 0.00016 
     | > step_time: 0.72870  (0.72866)
     | > loader_time: 0.31230  (0.31228)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.34202 [0m(-0.03150)
     | > avg_log_mle:[92m -0.33173 [0m(-0.01130)
     | > avg_loss_dur:[92m 0.67375 [0m(-0.02020)


[4m[1m > EPOCH: 651/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.37999 [0m(+0.03797)
     | > avg_log_mle:[91m -0.31630 [0m(+0.01543)
     | > avg_loss_dur:[91m 0.69630 [0m(+0.02255)


[4m[1m > EPOCH: 652/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.35919 [0m(-0.02080)
     | > avg_log_mle:[92m -0.31962 [0m(-0.00332)
     | > avg_loss_dur:[92m 0.67882 [0m(-0.01748)


[4m[1m > EPOCH: 653/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:05:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.50969 [0m(+0.15049)
     | > avg_log_mle:[91m -0.24360 [0m(+0.07603)
     | > avg_loss_dur:[91m 0.75328 [0m(+0.07446)


[4m[1m > EPOCH: 654/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:06:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.37033 [0m(-0.13936)
     | > avg_log_mle:[92m -0.30668 [0m(-0.06309)
     | > avg_loss_dur:[92m 0.67701 [0m(-0.07627)


[4m[1m > EPOCH: 655/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:06:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.52738 [0m(+0.15705)
     | > avg_log_mle:[91m -0.25553 [0m(+0.05115)
     | > avg_loss_dur:[91m 0.78291 [0m(+0.10590)


[4m[1m > EPOCH: 656/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:06:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36222 [0m(-0.16516)
     | > avg_log_mle:[92m -0.31611 [0m(-0.06058)
     | > avg_loss_dur:[92m 0.67833 [0m(-0.10458)


[4m[1m > EPOCH: 657/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:06:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.35024 [0m(-0.01198)
     | > avg_log_mle:[92m -0.31745 [0m(-0.00134)
     | > avg_loss_dur:[92m 0.66769 [0m(-0.01064)


[4m[1m > EPOCH: 658/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:06:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 1975[0m
     | > loss: -0.13561  (-0.13561)
     | > log_mle: -0.42381  (-0.42381)
     | > loss_dur: 0.28820  (0.28820)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 9.96634  (9.96634)
     | > current_lr: 0.00016 
     | > step_time: 1.02990  (1.02994)
     | > loader_time: 0.42440  (0.42438)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.41780 [0m(+0.06756)
     | > avg_log_mle:[92m -0.31880 [0m(-0.00136)
     | > avg_loss_dur:[91m 0.73660 [0m(+0.06891)


[4m[1m > EPOCH: 659/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:06:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.48923 [0m(+0.07143)
     | > avg_log_mle:[91m -0.31724 [0m(+0.00157)
     | > avg_loss_dur:[91m 0.80647 [0m(+0.06986)


[4m[1m > EPOCH: 660/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.39085 [0m(-0.09838)
     | > avg_log_mle:[91m -0.29834 [0m(+0.01890)
     | > avg_loss_dur:[92m 0.68918 [0m(-0.11728)


[4m[1m > EPOCH: 661/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.35297 [0m(-0.03788)
     | > avg_log_mle:[92m -0.32806 [0m(-0.02972)
     | > avg_loss_dur:[92m 0.68103 [0m(-0.00815)


[4m[1m > EPOCH: 662/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.33513 [0m(-0.01783)
     | > avg_log_mle:[91m -0.32648 [0m(+0.00159)
     | > avg_loss_dur:[92m 0.66161 [0m(-0.01942)


[4m[1m > EPOCH: 663/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.35967 [0m(+0.02453)
     | > avg_log_mle:[91m -0.30933 [0m(+0.01715)
     | > avg_loss_dur:[91m 0.66900 [0m(+0.00739)


[4m[1m > EPOCH: 664/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.36289 [0m(+0.00323)
     | > avg_log_mle:[92m -0.31424 [0m(-0.00491)
     | > avg_loss_dur:[91m 0.67713 [0m(+0.00813)


[4m[1m > EPOCH: 665/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.41275 [0m(+0.04985)
     | > avg_log_mle:[92m -0.32356 [0m(-0.00932)
     | > avg_loss_dur:[91m 0.73631 [0m(+0.05918)


[4m[1m > EPOCH: 666/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:07:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2000[0m
     | > loss: -0.38471  (-0.27403)
     | > log_mle: -0.66814  (-0.56058)
     | > loss_dur: 0.28343  (0.28655)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 19.26420  (18.87663)
     | > current_lr: 0.00017 
     | > step_time: 0.40440  (0.71865)
     | > loader_time: 0.10410  (0.26975)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.35079 [0m(-0.06196)
     | > avg_log_mle:[91m -0.32017 [0m(+0.00339)
     | > avg_loss_dur:[92m 0.67097 [0m(-0.06534)


[4m[1m > EPOCH: 667/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:08:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.34273 [0m(-0.00806)
     | > avg_log_mle:[91m -0.31343 [0m(+0.00674)
     | > avg_loss_dur:[92m 0.65616 [0m(-0.01480)


[4m[1m > EPOCH: 668/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:08:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.30595 [0m(-0.03678)
     | > avg_log_mle:[92m -0.32185 [0m(-0.00841)
     | > avg_loss_dur:[92m 0.62779 [0m(-0.02837)


[4m[1m > EPOCH: 669/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:08:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.37498 [0m(+0.06904)
     | > avg_log_mle:[91m -0.29229 [0m(+0.02955)
     | > avg_loss_dur:[91m 0.66728 [0m(+0.03948)


[4m[1m > EPOCH: 670/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:08:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39241 [0m(+0.01743)
     | > avg_log_mle:[92m -0.32860 [0m(-0.03630)
     | > avg_loss_dur:[91m 0.72101 [0m(+0.05373)


[4m[1m > EPOCH: 671/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:08:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.41877 [0m(+0.02636)
     | > avg_log_mle:[91m -0.30545 [0m(+0.02315)
     | > avg_loss_dur:[91m 0.72422 [0m(+0.00321)


[4m[1m > EPOCH: 672/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:08:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.39623 [0m(-0.02254)
     | > avg_log_mle:[92m -0.32547 [0m(-0.02002)
     | > avg_loss_dur:[92m 0.72170 [0m(-0.00252)


[4m[1m > EPOCH: 673/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.43567 [0m(+0.03943)
     | > avg_log_mle:[91m -0.31232 [0m(+0.01315)
     | > avg_loss_dur:[91m 0.74799 [0m(+0.02629)


[4m[1m > EPOCH: 674/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.39077 [0m(-0.04489)
     | > avg_log_mle:[92m -0.32752 [0m(-0.01519)
     | > avg_loss_dur:[92m 0.71829 [0m(-0.02970)


[4m[1m > EPOCH: 675/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2025[0m
     | > loss: -0.28430  (-0.28430)
     | > log_mle: -0.52985  (-0.52985)
     | > loss_dur: 0.24555  (0.24555)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 22.02848  (22.02848)
     | > current_lr: 0.00017 
     | > step_time: 0.72870  (0.72866)
     | > loader_time: 0.32430  (0.32428)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.37088 [0m(-0.01989)
     | > avg_log_mle:[91m -0.30760 [0m(+0.01992)
     | > avg_loss_dur:[92m 0.67848 [0m(-0.03980)


[4m[1m > EPOCH: 676/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.40728 [0m(+0.03639)
     | > avg_log_mle:[91m -0.27021 [0m(+0.03739)
     | > avg_loss_dur:[92m 0.67749 [0m(-0.00100)


[4m[1m > EPOCH: 677/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[91m 0.42729 [0m(+0.02001)
     | > avg_log_mle:[92m -0.30530 [0m(-0.03508)
     | > avg_loss_dur:[91m 0.73259 [0m(+0.05510)


[4m[1m > EPOCH: 678/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[91m 0.47397 [0m(+0.04668)
     | > avg_log_mle:[91m -0.23876 [0m(+0.06654)
     | > avg_loss_dur:[92m 0.71273 [0m(-0.01986)


[4m[1m > EPOCH: 679/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:09:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.40518 [0m(-0.06879)
     | > avg_log_mle:[92m -0.25177 [0m(-0.01301)
     | > avg_loss_dur:[92m 0.65695 [0m(-0.05578)


[4m[1m > EPOCH: 680/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.40352 [0m(-0.00166)
     | > avg_log_mle:[92m -0.28209 [0m(-0.03032)
     | > avg_loss_dur:[91m 0.68562 [0m(+0.02867)


[4m[1m > EPOCH: 681/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[91m 0.47470 [0m(+0.07118)
     | > avg_log_mle:[91m -0.27945 [0m(+0.00264)
     | > avg_loss_dur:[91m 0.75416 [0m(+0.06854)


[4m[1m > EPOCH: 682/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.39134 [0m(-0.08336)
     | > avg_log_mle:[92m -0.29528 [0m(-0.01583)
     | > avg_loss_dur:[92m 0.68662 [0m(-0.06754)


[4m[1m > EPOCH: 683/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2050[0m
     | > loss: -0.14970  (-0.14970)
     | > log_mle: -0.43485  (-0.43485)
     | > loss_dur: 0.28515  (0.28515)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 15.85433  (15.85433)
     | > current_lr: 0.00017 
     | > step_time: 1.03990  (1.03994)
     | > loader_time: 0.42140  (0.42138)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.41749 [0m(+0.02615)
     | > avg_log_mle:[92m -0.30593 [0m(-0.01066)
     | > avg_loss_dur:[91m 0.72343 [0m(+0.03681)


[4m[1m > EPOCH: 684/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.37042 [0m(-0.04707)
     | > avg_log_mle:[92m -0.31860 [0m(-0.01266)
     | > avg_loss_dur:[92m 0.68901 [0m(-0.03441)


[4m[1m > EPOCH: 685/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.35992 [0m(-0.01049)
     | > avg_log_mle:[92m -0.32236 [0m(-0.00377)
     | > avg_loss_dur:[92m 0.68229 [0m(-0.00673)


[4m[1m > EPOCH: 686/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:10:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.41903 [0m(+0.05910)
     | > avg_log_mle:[91m -0.29714 [0m(+0.02522)
     | > avg_loss_dur:[91m 0.71617 [0m(+0.03389)


[4m[1m > EPOCH: 687/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:11:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.38275 [0m(-0.03628)
     | > avg_log_mle:[92m -0.31656 [0m(-0.01941)
     | > avg_loss_dur:[92m 0.69930 [0m(-0.01687)


[4m[1m > EPOCH: 688/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:11:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00200)
     | > avg_loss:[92m 0.33427 [0m(-0.04847)
     | > avg_log_mle:[91m -0.31488 [0m(+0.00168)
     | > avg_loss_dur:[92m 0.64915 [0m(-0.05015)


[4m[1m > EPOCH: 689/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:11:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[92m 0.33044 [0m(-0.00384)
     | > avg_log_mle:[92m -0.32365 [0m(-0.00877)
     | > avg_loss_dur:[91m 0.65408 [0m(+0.00493)


[4m[1m > EPOCH: 690/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:11:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.30677 [0m(-0.02367)
     | > avg_log_mle:[91m -0.32025 [0m(+0.00340)
     | > avg_loss_dur:[92m 0.62702 [0m(-0.02707)


[4m[1m > EPOCH: 691/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:11:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2075[0m
     | > loss: -0.42589  (-0.30696)
     | > log_mle: -0.69347  (-0.58143)
     | > loss_dur: 0.26758  (0.27447)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 67.52007  (57.96931)
     | > current_lr: 0.00017 
     | > step_time: 0.40640  (0.72066)
     | > loader_time: 0.10010  (0.26373)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.31759 [0m(+0.01082)
     | > avg_log_mle:[91m -0.31244 [0m(+0.00781)
     | > avg_loss_dur:[91m 0.63003 [0m(+0.00301)


[4m[1m > EPOCH: 692/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:11:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.35110 [0m(+0.03350)
     | > avg_log_mle:[92m -0.32340 [0m(-0.01097)
     | > avg_loss_dur:[91m 0.67450 [0m(+0.04447)


[4m[1m > EPOCH: 693/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.35506 [0m(+0.00396)
     | > avg_log_mle:[91m -0.30871 [0m(+0.01469)
     | > avg_loss_dur:[92m 0.66377 [0m(-0.01073)


[4m[1m > EPOCH: 694/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.34147 [0m(-0.01358)
     | > avg_log_mle:[92m -0.32768 [0m(-0.01897)
     | > avg_loss_dur:[91m 0.66915 [0m(+0.00538)


[4m[1m > EPOCH: 695/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39513 [0m(+0.05365)
     | > avg_log_mle:[91m -0.31878 [0m(+0.00890)
     | > avg_loss_dur:[91m 0.71390 [0m(+0.04475)


[4m[1m > EPOCH: 696/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.40069 [0m(+0.00557)
     | > avg_log_mle:[91m -0.30478 [0m(+0.01400)
     | > avg_loss_dur:[92m 0.70547 [0m(-0.00843)


[4m[1m > EPOCH: 697/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.38272 [0m(-0.01797)
     | > avg_log_mle:[92m -0.30833 [0m(-0.00355)
     | > avg_loss_dur:[92m 0.69105 [0m(-0.01441)


[4m[1m > EPOCH: 698/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.37942 [0m(-0.00331)
     | > avg_log_mle:[92m -0.31018 [0m(-0.00185)
     | > avg_loss_dur:[92m 0.68960 [0m(-0.00145)


[4m[1m > EPOCH: 699/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:12:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.37655 [0m(-0.00287)
     | > avg_log_mle:[92m -0.31233 [0m(-0.00215)
     | > avg_loss_dur:[92m 0.68888 [0m(-0.00072)


[4m[1m > EPOCH: 700/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2100[0m
     | > loss: -0.32275  (-0.32275)
     | > log_mle: -0.55911  (-0.55911)
     | > loss_dur: 0.23635  (0.23635)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 18.67813  (18.67813)
     | > current_lr: 0.00017 
     | > step_time: 0.72570  (0.72567)
     | > loader_time: 0.31830  (0.31829)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.34989 [0m(-0.02666)
     | > avg_log_mle:[91m -0.30132 [0m(+0.01101)
     | > avg_loss_dur:[92m 0.65121 [0m(-0.03766)


[4m[1m > EPOCH: 701/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.35726 [0m(+0.00737)
     | > avg_log_mle:[92m -0.31507 [0m(-0.01374)
     | > avg_loss_dur:[91m 0.67233 [0m(+0.02111)


[4m[1m > EPOCH: 702/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.38783 [0m(+0.03057)
     | > avg_log_mle:[91m -0.30968 [0m(+0.00539)
     | > avg_loss_dur:[91m 0.69751 [0m(+0.02518)


[4m[1m > EPOCH: 703/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.39670 [0m(+0.00887)
     | > avg_log_mle:[91m -0.30623 [0m(+0.00345)
     | > avg_loss_dur:[91m 0.70293 [0m(+0.00542)


[4m[1m > EPOCH: 704/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.40281 [0m(+0.00611)
     | > avg_log_mle:[92m -0.31009 [0m(-0.00387)
     | > avg_loss_dur:[91m 0.71290 [0m(+0.00998)


[4m[1m > EPOCH: 705/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35553 [0m(-0.04728)
     | > avg_log_mle:[92m -0.31231 [0m(-0.00222)
     | > avg_loss_dur:[92m 0.66784 [0m(-0.04506)


[4m[1m > EPOCH: 706/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:13:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.38768 [0m(+0.03216)
     | > avg_log_mle:[91m -0.30572 [0m(+0.00660)
     | > avg_loss_dur:[91m 0.69340 [0m(+0.02556)


[4m[1m > EPOCH: 707/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:14:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.34889 [0m(-0.03880)
     | > avg_log_mle:[91m -0.30040 [0m(+0.00532)
     | > avg_loss_dur:[92m 0.64928 [0m(-0.04412)


[4m[1m > EPOCH: 708/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:14:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2125[0m
     | > loss: -0.21087  (-0.21087)
     | > log_mle: -0.48454  (-0.48454)
     | > loss_dur: 0.27366  (0.27366)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 26.92874  (26.92874)
     | > current_lr: 0.00018 
     | > step_time: 1.03090  (1.03095)
     | > loader_time: 0.43340  (0.43339)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.42250 [0m(+0.07361)
     | > avg_log_mle:[91m -0.28859 [0m(+0.01181)
     | > avg_loss_dur:[91m 0.71109 [0m(+0.06180)


[4m[1m > EPOCH: 709/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:14:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35992 [0m(-0.06257)
     | > avg_log_mle:[92m -0.30397 [0m(-0.01538)
     | > avg_loss_dur:[92m 0.66389 [0m(-0.04719)


[4m[1m > EPOCH: 710/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:14:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.44113 [0m(+0.08121)
     | > avg_log_mle:[91m -0.29267 [0m(+0.01130)
     | > avg_loss_dur:[91m 0.73380 [0m(+0.06991)


[4m[1m > EPOCH: 711/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:14:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.37066 [0m(-0.07047)
     | > avg_log_mle:[91m -0.29130 [0m(+0.00137)
     | > avg_loss_dur:[92m 0.66196 [0m(-0.07184)


[4m[1m > EPOCH: 712/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:14:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.45923 [0m(+0.08857)
     | > avg_log_mle:[91m -0.28149 [0m(+0.00982)
     | > avg_loss_dur:[91m 0.74072 [0m(+0.07875)


[4m[1m > EPOCH: 713/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.38208 [0m(-0.07716)
     | > avg_log_mle:[92m -0.28230 [0m(-0.00081)
     | > avg_loss_dur:[92m 0.66437 [0m(-0.07634)


[4m[1m > EPOCH: 714/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.37874 [0m(-0.00333)
     | > avg_log_mle:[92m -0.30824 [0m(-0.02595)
     | > avg_loss_dur:[91m 0.68699 [0m(+0.02261)


[4m[1m > EPOCH: 715/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.43786 [0m(+0.05911)
     | > avg_log_mle:[91m -0.24246 [0m(+0.06578)
     | > avg_loss_dur:[92m 0.68032 [0m(-0.00667)


[4m[1m > EPOCH: 716/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2150[0m
     | > loss: -0.44934  (-0.30691)
     | > log_mle: -0.70081  (-0.57057)
     | > loss_dur: 0.25147  (0.26366)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 28.94624  (26.27694)
     | > current_lr: 0.00018 
     | > step_time: 0.39740  (0.71715)
     | > loader_time: 0.10310  (0.26574)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41977 [0m(-0.01809)
     | > avg_log_mle:[92m -0.30478 [0m(-0.06232)
     | > avg_loss_dur:[91m 0.72455 [0m(+0.04423)


[4m[1m > EPOCH: 717/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.40104 [0m(-0.01873)
     | > avg_log_mle:[92m -0.30524 [0m(-0.00045)
     | > avg_loss_dur:[92m 0.70628 [0m(-0.01828)


[4m[1m > EPOCH: 718/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.55745 [0m(+0.15642)
     | > avg_log_mle:[91m -0.26327 [0m(+0.04197)
     | > avg_loss_dur:[91m 0.82072 [0m(+0.11444)


[4m[1m > EPOCH: 719/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:15:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 0.30595 [0m(-0.25150)
     | > avg_log_mle:[92m -0.31681 [0m(-0.05354)
     | > avg_loss_dur:[92m 0.62276 [0m(-0.19796)


[4m[1m > EPOCH: 720/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:16:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.41017 [0m(+0.10422)
     | > avg_log_mle:[91m -0.28846 [0m(+0.02835)
     | > avg_loss_dur:[91m 0.69863 [0m(+0.07587)


[4m[1m > EPOCH: 721/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:16:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.45376 [0m(+0.04359)
     | > avg_log_mle:[92m -0.28873 [0m(-0.00028)
     | > avg_loss_dur:[91m 0.74250 [0m(+0.04387)


[4m[1m > EPOCH: 722/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:16:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.37608 [0m(-0.07768)
     | > avg_log_mle:[92m -0.30368 [0m(-0.01494)
     | > avg_loss_dur:[92m 0.67975 [0m(-0.06274)


[4m[1m > EPOCH: 723/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:16:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.37466 [0m(-0.00142)
     | > avg_log_mle:[92m -0.30569 [0m(-0.00202)
     | > avg_loss_dur:[91m 0.68035 [0m(+0.00060)


[4m[1m > EPOCH: 724/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:16:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.38694 [0m(+0.01229)
     | > avg_log_mle:[91m -0.28954 [0m(+0.01615)
     | > avg_loss_dur:[92m 0.67649 [0m(-0.00386)


[4m[1m > EPOCH: 725/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:16:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2175[0m
     | > loss: -0.28824  (-0.28824)
     | > log_mle: -0.52594  (-0.52594)
     | > loss_dur: 0.23770  (0.23770)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 10.08979  (10.08979)
     | > current_lr: 0.00018 
     | > step_time: 0.82580  (0.82575)
     | > loader_time: 0.32130  (0.32128)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.45520 [0m(+0.06826)
     | > avg_log_mle:[92m -0.29479 [0m(-0.00525)
     | > avg_loss_dur:[91m 0.74999 [0m(+0.07350)


[4m[1m > EPOCH: 726/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 0.37805 [0m(-0.07715)
     | > avg_log_mle:[92m -0.30871 [0m(-0.01392)
     | > avg_loss_dur:[92m 0.68676 [0m(-0.06323)


[4m[1m > EPOCH: 727/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.39946 [0m(+0.02141)
     | > avg_log_mle:[91m -0.30406 [0m(+0.00465)
     | > avg_loss_dur:[91m 0.70352 [0m(+0.01676)


[4m[1m > EPOCH: 728/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.41649 [0m(+0.01703)
     | > avg_log_mle:[91m -0.28377 [0m(+0.02029)
     | > avg_loss_dur:[92m 0.70025 [0m(-0.00327)


[4m[1m > EPOCH: 729/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.49560 [0m(+0.07911)
     | > avg_log_mle:[91m -0.28261 [0m(+0.00115)
     | > avg_loss_dur:[91m 0.77821 [0m(+0.07796)


[4m[1m > EPOCH: 730/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.46442 [0m(-0.03118)
     | > avg_log_mle:[92m -0.28445 [0m(-0.00184)
     | > avg_loss_dur:[92m 0.74887 [0m(-0.02934)


[4m[1m > EPOCH: 731/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.52989 [0m(+0.06547)
     | > avg_log_mle:[92m -0.28994 [0m(-0.00549)
     | > avg_loss_dur:[91m 0.81983 [0m(+0.07096)


[4m[1m > EPOCH: 732/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:17:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.47581 [0m(-0.05408)
     | > avg_log_mle:[91m -0.28821 [0m(+0.00173)
     | > avg_loss_dur:[92m 0.76401 [0m(-0.05582)


[4m[1m > EPOCH: 733/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:18:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2200[0m
     | > loss: -0.20562  (-0.20562)
     | > log_mle: -0.47931  (-0.47931)
     | > loss_dur: 0.27369  (0.27369)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 27.76603  (27.76603)
     | > current_lr: 0.00018 
     | > step_time: 1.03800  (1.03795)
     | > loader_time: 0.41740  (0.41738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.40222 [0m(-0.07359)
     | > avg_log_mle:[91m -0.27684 [0m(+0.01137)
     | > avg_loss_dur:[92m 0.67906 [0m(-0.08495)


[4m[1m > EPOCH: 734/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:18:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.34714 [0m(-0.05508)
     | > avg_log_mle:[92m -0.29216 [0m(-0.01532)
     | > avg_loss_dur:[92m 0.63930 [0m(-0.03976)


[4m[1m > EPOCH: 735/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:18:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.39100 [0m(+0.04387)
     | > avg_log_mle:[91m -0.28827 [0m(+0.00389)
     | > avg_loss_dur:[91m 0.67927 [0m(+0.03998)


[4m[1m > EPOCH: 736/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:18:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.44518 [0m(+0.05417)
     | > avg_log_mle:[92m -0.29489 [0m(-0.00662)
     | > avg_loss_dur:[91m 0.74007 [0m(+0.06080)


[4m[1m > EPOCH: 737/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:18:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.42163 [0m(-0.02355)
     | > avg_log_mle:[91m -0.28967 [0m(+0.00522)
     | > avg_loss_dur:[92m 0.71130 [0m(-0.02877)


[4m[1m > EPOCH: 738/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:18:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.40377 [0m(-0.01786)
     | > avg_log_mle:[92m -0.28973 [0m(-0.00006)
     | > avg_loss_dur:[92m 0.69350 [0m(-0.01780)


[4m[1m > EPOCH: 739/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.47844 [0m(+0.07467)
     | > avg_log_mle:[91m -0.27482 [0m(+0.01491)
     | > avg_loss_dur:[91m 0.75326 [0m(+0.05976)


[4m[1m > EPOCH: 740/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.47860 [0m(+0.00016)
     | > avg_log_mle:[91m -0.25104 [0m(+0.02378)
     | > avg_loss_dur:[92m 0.72964 [0m(-0.02362)


[4m[1m > EPOCH: 741/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2225[0m
     | > loss: -0.52075  (-0.37063)
     | > log_mle: -0.74910  (-0.61995)
     | > loss_dur: 0.22835  (0.24932)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 30.47394  (23.27007)
     | > current_lr: 0.00019 
     | > step_time: 0.40240  (0.71915)
     | > loader_time: 0.10110  (0.26524)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.43859 [0m(-0.04001)
     | > avg_log_mle:[92m -0.26357 [0m(-0.01253)
     | > avg_loss_dur:[92m 0.70215 [0m(-0.02748)


[4m[1m > EPOCH: 742/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.43322 [0m(-0.00536)
     | > avg_log_mle:[92m -0.27995 [0m(-0.01639)
     | > avg_loss_dur:[91m 0.71318 [0m(+0.01102)


[4m[1m > EPOCH: 743/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.50438 [0m(+0.07116)
     | > avg_log_mle:[91m -0.22908 [0m(+0.05087)
     | > avg_loss_dur:[91m 0.73346 [0m(+0.02028)


[4m[1m > EPOCH: 744/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.40526 [0m(-0.09912)
     | > avg_log_mle:[92m -0.29937 [0m(-0.07029)
     | > avg_loss_dur:[92m 0.70463 [0m(-0.02883)


[4m[1m > EPOCH: 745/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:19:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.62769 [0m(+0.22243)
     | > avg_log_mle:[91m -0.09707 [0m(+0.20231)
     | > avg_loss_dur:[91m 0.72475 [0m(+0.02012)


[4m[1m > EPOCH: 746/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:20:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.69352 [0m(+0.06584)
     | > avg_log_mle:[91m -0.04013 [0m(+0.05693)
     | > avg_loss_dur:[91m 0.73366 [0m(+0.00890)


[4m[1m > EPOCH: 747/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:20:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.89385 [0m(+0.20033)
     | > avg_log_mle:[92m -0.22669 [0m(-0.18655)
     | > avg_loss_dur:[91m 1.12054 [0m(+0.38689)


[4m[1m > EPOCH: 748/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:20:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.48256 [0m(-0.41129)
     | > avg_log_mle:[91m -0.21875 [0m(+0.00794)
     | > avg_loss_dur:[92m 0.70131 [0m(-0.41924)


[4m[1m > EPOCH: 749/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:20:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.47263 [0m(-0.00993)
     | > avg_log_mle:[92m -0.24445 [0m(-0.02570)
     | > avg_loss_dur:[91m 0.71708 [0m(+0.01577)


[4m[1m > EPOCH: 750/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:20:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2250[0m
     | > loss: -0.17469  (-0.17469)
     | > log_mle: -0.42459  (-0.42459)
     | > loss_dur: 0.24990  (0.24990)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 6.87294  (6.87294)
     | > current_lr: 0.00019 
     | > step_time: 0.86680  (0.86679)
     | > loader_time: 0.32530  (0.32530)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.55618 [0m(+0.08355)
     | > avg_log_mle:[92m -0.24639 [0m(-0.00194)
     | > avg_loss_dur:[91m 0.80257 [0m(+0.08549)


[4m[1m > EPOCH: 751/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:20:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.51472 [0m(-0.04146)
     | > avg_log_mle:[92m -0.25027 [0m(-0.00388)
     | > avg_loss_dur:[92m 0.76499 [0m(-0.03758)


[4m[1m > EPOCH: 752/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.41209 [0m(-0.10262)
     | > avg_log_mle:[92m -0.28380 [0m(-0.03352)
     | > avg_loss_dur:[92m 0.69589 [0m(-0.06910)


[4m[1m > EPOCH: 753/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.50558 [0m(+0.09349)
     | > avg_log_mle:[91m -0.23933 [0m(+0.04446)
     | > avg_loss_dur:[91m 0.74492 [0m(+0.04903)


[4m[1m > EPOCH: 754/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.48437 [0m(-0.02122)
     | > avg_log_mle:[92m -0.29468 [0m(-0.05535)
     | > avg_loss_dur:[91m 0.77905 [0m(+0.03413)


[4m[1m > EPOCH: 755/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.53915 [0m(+0.05478)
     | > avg_log_mle:[91m -0.27500 [0m(+0.01968)
     | > avg_loss_dur:[91m 0.81415 [0m(+0.03510)


[4m[1m > EPOCH: 756/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.64114 [0m(+0.10199)
     | > avg_log_mle:[91m -0.21414 [0m(+0.06087)
     | > avg_loss_dur:[91m 0.85528 [0m(+0.04112)


[4m[1m > EPOCH: 757/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.44898 [0m(-0.19216)
     | > avg_log_mle:[92m -0.27800 [0m(-0.06386)
     | > avg_loss_dur:[92m 0.72698 [0m(-0.12830)


[4m[1m > EPOCH: 758/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:21:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2275[0m
     | > loss: -0.15303  (-0.15303)
     | > log_mle: -0.43946  (-0.43946)
     | > loss_dur: 0.28642  (0.28642)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 9.89924  (9.89924)
     | > current_lr: 0.00019 
     | > step_time: 1.03990  (1.03995)
     | > loader_time: 0.43040  (0.43039)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.41486 [0m(-0.03412)
     | > avg_log_mle:[92m -0.29801 [0m(-0.02001)
     | > avg_loss_dur:[92m 0.71287 [0m(-0.01411)


[4m[1m > EPOCH: 759/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:22:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.46157 [0m(+0.04671)
     | > avg_log_mle:[92m -0.31347 [0m(-0.01546)
     | > avg_loss_dur:[91m 0.77504 [0m(+0.06217)


[4m[1m > EPOCH: 760/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:22:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.36366 [0m(-0.09791)
     | > avg_log_mle:[91m -0.30505 [0m(+0.00842)
     | > avg_loss_dur:[92m 0.66871 [0m(-0.10633)


[4m[1m > EPOCH: 761/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:22:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.43763 [0m(+0.07397)
     | > avg_log_mle:[92m -0.31042 [0m(-0.00536)
     | > avg_loss_dur:[91m 0.74805 [0m(+0.07934)


[4m[1m > EPOCH: 762/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:22:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.40947 [0m(-0.02816)
     | > avg_log_mle:[92m -0.32567 [0m(-0.01526)
     | > avg_loss_dur:[92m 0.73514 [0m(-0.01291)


[4m[1m > EPOCH: 763/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:22:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.47802 [0m(+0.06855)
     | > avg_log_mle:[91m -0.30684 [0m(+0.01884)
     | > avg_loss_dur:[91m 0.78485 [0m(+0.04971)


[4m[1m > EPOCH: 764/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:22:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.36997 [0m(-0.10805)
     | > avg_log_mle:[92m -0.30686 [0m(-0.00002)
     | > avg_loss_dur:[92m 0.67683 [0m(-0.10803)


[4m[1m > EPOCH: 765/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.39645 [0m(+0.02648)
     | > avg_log_mle:[91m -0.30595 [0m(+0.00091)
     | > avg_loss_dur:[91m 0.70240 [0m(+0.02557)


[4m[1m > EPOCH: 766/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2300[0m
     | > loss: -0.53408  (-0.37499)
     | > log_mle: -0.74544  (-0.61556)
     | > loss_dur: 0.21136  (0.24057)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 19.14081  (21.75130)
     | > current_lr: 0.00019 
     | > step_time: 0.40240  (0.71665)
     | > loader_time: 0.11210  (0.26824)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.35873 [0m(-0.03771)
     | > avg_log_mle:[91m -0.29899 [0m(+0.00696)
     | > avg_loss_dur:[92m 0.65772 [0m(-0.04467)


[4m[1m > EPOCH: 767/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.33362 [0m(-0.02511)
     | > avg_log_mle:[92m -0.30198 [0m(-0.00299)
     | > avg_loss_dur:[92m 0.63560 [0m(-0.02212)


[4m[1m > EPOCH: 768/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.35341 [0m(+0.01978)
     | > avg_log_mle:[91m -0.29434 [0m(+0.00764)
     | > avg_loss_dur:[91m 0.64775 [0m(+0.01215)


[4m[1m > EPOCH: 769/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.40055 [0m(+0.04714)
     | > avg_log_mle:[92m -0.30321 [0m(-0.00887)
     | > avg_loss_dur:[91m 0.70376 [0m(+0.05602)


[4m[1m > EPOCH: 770/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.42000 [0m(+0.01945)
     | > avg_log_mle:[91m -0.29623 [0m(+0.00699)
     | > avg_loss_dur:[91m 0.71623 [0m(+0.01246)


[4m[1m > EPOCH: 771/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:23:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.45899 [0m(+0.03898)
     | > avg_log_mle:[91m -0.28963 [0m(+0.00659)
     | > avg_loss_dur:[91m 0.74862 [0m(+0.03239)


[4m[1m > EPOCH: 772/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:24:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.43533 [0m(-0.02366)
     | > avg_log_mle:[92m -0.29874 [0m(-0.00911)
     | > avg_loss_dur:[92m 0.73407 [0m(-0.01455)


[4m[1m > EPOCH: 773/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:24:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41059 [0m(-0.02474)
     | > avg_log_mle:[91m -0.29308 [0m(+0.00566)
     | > avg_loss_dur:[92m 0.70367 [0m(-0.03040)


[4m[1m > EPOCH: 774/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:24:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.42799 [0m(+0.01740)
     | > avg_log_mle:[91m -0.28388 [0m(+0.00919)
     | > avg_loss_dur:[91m 0.71188 [0m(+0.00821)


[4m[1m > EPOCH: 775/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:24:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2325[0m
     | > loss: -0.37144  (-0.37144)
     | > log_mle: -0.59145  (-0.59145)
     | > loss_dur: 0.22001  (0.22001)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 26.50136  (26.50136)
     | > current_lr: 0.00019 
     | > step_time: 0.91080  (0.91083)
     | > loader_time: 0.33830  (0.33831)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.43628 [0m(+0.00829)
     | > avg_log_mle:[92m -0.29666 [0m(-0.01278)
     | > avg_loss_dur:[91m 0.73294 [0m(+0.02107)


[4m[1m > EPOCH: 776/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:24:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.36559 [0m(-0.07069)
     | > avg_log_mle:[91m -0.28443 [0m(+0.01223)
     | > avg_loss_dur:[92m 0.65002 [0m(-0.08293)


[4m[1m > EPOCH: 777/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:24:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.46450 [0m(+0.09892)
     | > avg_log_mle:[92m -0.28511 [0m(-0.00068)
     | > avg_loss_dur:[91m 0.74961 [0m(+0.09959)


[4m[1m > EPOCH: 778/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.42685 [0m(-0.03765)
     | > avg_log_mle:[91m -0.27837 [0m(+0.00673)
     | > avg_loss_dur:[92m 0.70523 [0m(-0.04438)


[4m[1m > EPOCH: 779/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.42579 [0m(-0.00106)
     | > avg_log_mle:[92m -0.28664 [0m(-0.00827)
     | > avg_loss_dur:[91m 0.71244 [0m(+0.00721)


[4m[1m > EPOCH: 780/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.39003 [0m(-0.03576)
     | > avg_log_mle:[91m -0.28189 [0m(+0.00475)
     | > avg_loss_dur:[92m 0.67193 [0m(-0.04051)


[4m[1m > EPOCH: 781/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[91m 0.48351 [0m(+0.09348)
     | > avg_log_mle:[92m -0.28223 [0m(-0.00034)
     | > avg_loss_dur:[91m 0.76574 [0m(+0.09381)


[4m[1m > EPOCH: 782/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 0.43262 [0m(-0.05089)
     | > avg_log_mle:[91m -0.27548 [0m(+0.00675)
     | > avg_loss_dur:[92m 0.70810 [0m(-0.05764)


[4m[1m > EPOCH: 783/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2350[0m
     | > loss: -0.26575  (-0.26575)
     | > log_mle: -0.52403  (-0.52403)
     | > loss_dur: 0.25828  (0.25828)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 23.46412  (23.46412)
     | > current_lr: 0.00020 
     | > step_time: 1.03800  (1.03796)
     | > loader_time: 0.42340  (0.42338)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.41535 [0m(-0.01727)
     | > avg_log_mle:[92m -0.27946 [0m(-0.00398)
     | > avg_loss_dur:[92m 0.69481 [0m(-0.01329)


[4m[1m > EPOCH: 784/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:25:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.49673 [0m(+0.08139)
     | > avg_log_mle:[91m -0.21101 [0m(+0.06846)
     | > avg_loss_dur:[91m 0.70774 [0m(+0.01293)


[4m[1m > EPOCH: 785/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:26:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.64931 [0m(+0.15258)
     | > avg_log_mle:[91m -0.10458 [0m(+0.10642)
     | > avg_loss_dur:[91m 0.75390 [0m(+0.04616)


[4m[1m > EPOCH: 786/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:26:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.51529 [0m(-0.13402)
     | > avg_log_mle:[92m -0.21654 [0m(-0.11196)
     | > avg_loss_dur:[92m 0.73183 [0m(-0.02206)


[4m[1m > EPOCH: 787/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:26:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.41061 [0m(-0.10468)
     | > avg_log_mle:[92m -0.27481 [0m(-0.05827)
     | > avg_loss_dur:[92m 0.68542 [0m(-0.04641)


[4m[1m > EPOCH: 788/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:26:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.49707 [0m(+0.08645)
     | > avg_log_mle:[91m -0.24615 [0m(+0.02866)
     | > avg_loss_dur:[91m 0.74321 [0m(+0.05779)


[4m[1m > EPOCH: 789/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:26:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.40108 [0m(-0.09599)
     | > avg_log_mle:[92m -0.28706 [0m(-0.04092)
     | > avg_loss_dur:[92m 0.68814 [0m(-0.05507)


[4m[1m > EPOCH: 790/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:26:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.43349 [0m(+0.03241)
     | > avg_log_mle:[91m -0.27710 [0m(+0.00996)
     | > avg_loss_dur:[91m 0.71058 [0m(+0.02245)


[4m[1m > EPOCH: 791/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2375[0m
     | > loss: -0.58138  (-0.41627)
     | > log_mle: -0.75970  (-0.63452)
     | > loss_dur: 0.17831  (0.21825)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 28.06658  (29.43142)
     | > current_lr: 0.00020 
     | > step_time: 0.40440  (0.71865)
     | > loader_time: 0.10110  (0.25723)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.41496 [0m(-0.01852)
     | > avg_log_mle:[91m -0.24569 [0m(+0.03141)
     | > avg_loss_dur:[92m 0.66065 [0m(-0.04993)


[4m[1m > EPOCH: 792/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.46744 [0m(+0.05248)
     | > avg_log_mle:[92m -0.26607 [0m(-0.02038)
     | > avg_loss_dur:[91m 0.73352 [0m(+0.07286)


[4m[1m > EPOCH: 793/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.40285 [0m(-0.06459)
     | > avg_log_mle:[92m -0.28019 [0m(-0.01412)
     | > avg_loss_dur:[92m 0.68304 [0m(-0.05047)


[4m[1m > EPOCH: 794/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.38209 [0m(-0.02076)
     | > avg_log_mle:[91m -0.27277 [0m(+0.00742)
     | > avg_loss_dur:[92m 0.65486 [0m(-0.02818)


[4m[1m > EPOCH: 795/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[91m 0.41951 [0m(+0.03742)
     | > avg_log_mle:[92m -0.27686 [0m(-0.00409)
     | > avg_loss_dur:[91m 0.69637 [0m(+0.04151)


[4m[1m > EPOCH: 796/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.46633 [0m(+0.04682)
     | > avg_log_mle:[92m -0.28133 [0m(-0.00447)
     | > avg_loss_dur:[91m 0.74767 [0m(+0.05129)


[4m[1m > EPOCH: 797/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:27:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.42477 [0m(-0.04157)
     | > avg_log_mle:[91m -0.27212 [0m(+0.00922)
     | > avg_loss_dur:[92m 0.69688 [0m(-0.05078)


[4m[1m > EPOCH: 798/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:28:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.42766 [0m(+0.00290)
     | > avg_log_mle:[92m -0.28237 [0m(-0.01025)
     | > avg_loss_dur:[91m 0.71003 [0m(+0.01315)


[4m[1m > EPOCH: 799/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:28:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.39989 [0m(-0.02777)
     | > avg_log_mle:[92m -0.28726 [0m(-0.00489)
     | > avg_loss_dur:[92m 0.68715 [0m(-0.02288)


[4m[1m > EPOCH: 800/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:28:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2400[0m
     | > loss: -0.40104  (-0.40104)
     | > log_mle: -0.60908  (-0.60908)
     | > loss_dur: 0.20805  (0.20805)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 22.08398  (22.08398)
     | > current_lr: 0.00020 
     | > step_time: 0.80870  (0.80873)
     | > loader_time: 0.31230  (0.31228)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.41283 [0m(+0.01294)
     | > avg_log_mle:[91m -0.27684 [0m(+0.01042)
     | > avg_loss_dur:[91m 0.68967 [0m(+0.00252)


[4m[1m > EPOCH: 801/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:28:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.41829 [0m(+0.00546)
     | > avg_log_mle:[91m -0.27478 [0m(+0.00206)
     | > avg_loss_dur:[91m 0.69307 [0m(+0.00340)


[4m[1m > EPOCH: 802/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:28:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.41404 [0m(-0.00425)
     | > avg_log_mle:[92m -0.27685 [0m(-0.00207)
     | > avg_loss_dur:[92m 0.69089 [0m(-0.00218)


[4m[1m > EPOCH: 803/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:28:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.48947 [0m(+0.07543)
     | > avg_log_mle:[91m -0.27094 [0m(+0.00591)
     | > avg_loss_dur:[91m 0.76040 [0m(+0.06951)


[4m[1m > EPOCH: 804/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.53769 [0m(+0.04822)
     | > avg_log_mle:[91m -0.24531 [0m(+0.02562)
     | > avg_loss_dur:[91m 0.78300 [0m(+0.02260)


[4m[1m > EPOCH: 805/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.51241 [0m(-0.02528)
     | > avg_log_mle:[92m -0.26382 [0m(-0.01851)
     | > avg_loss_dur:[92m 0.77623 [0m(-0.00677)


[4m[1m > EPOCH: 806/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 0.49693 [0m(-0.01549)
     | > avg_log_mle:[91m -0.26175 [0m(+0.00207)
     | > avg_loss_dur:[92m 0.75868 [0m(-0.01756)


[4m[1m > EPOCH: 807/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.45162 [0m(-0.04531)
     | > avg_log_mle:[91m -0.25956 [0m(+0.00220)
     | > avg_loss_dur:[92m 0.71117 [0m(-0.04750)


[4m[1m > EPOCH: 808/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2425[0m
     | > loss: -0.29177  (-0.29177)
     | > log_mle: -0.53513  (-0.53513)
     | > loss_dur: 0.24336  (0.24336)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 33.59172  (33.59172)
     | > current_lr: 0.00020 
     | > step_time: 1.03500  (1.03495)
     | > loader_time: 0.41840  (0.41838)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.45826 [0m(+0.00665)
     | > avg_log_mle:[92m -0.26943 [0m(-0.00987)
     | > avg_loss_dur:[91m 0.72769 [0m(+0.01652)


[4m[1m > EPOCH: 809/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.43048 [0m(-0.02779)
     | > avg_log_mle:[91m -0.26853 [0m(+0.00089)
     | > avg_loss_dur:[92m 0.69901 [0m(-0.02868)


[4m[1m > EPOCH: 810/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:29:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.50267 [0m(+0.07219)
     | > avg_log_mle:[92m -0.27244 [0m(-0.00391)
     | > avg_loss_dur:[91m 0.77511 [0m(+0.07610)


[4m[1m > EPOCH: 811/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:30:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.45397 [0m(-0.04870)
     | > avg_log_mle:[91m -0.25201 [0m(+0.02043)
     | > avg_loss_dur:[92m 0.70598 [0m(-0.06913)


[4m[1m > EPOCH: 812/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:30:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.44069 [0m(-0.01328)
     | > avg_log_mle:[92m -0.25779 [0m(-0.00577)
     | > avg_loss_dur:[92m 0.69848 [0m(-0.00750)


[4m[1m > EPOCH: 813/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:30:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.47999 [0m(+0.03930)
     | > avg_log_mle:[92m -0.26436 [0m(-0.00657)
     | > avg_loss_dur:[91m 0.74435 [0m(+0.04587)


[4m[1m > EPOCH: 814/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:30:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.48228 [0m(+0.00228)
     | > avg_log_mle:[92m -0.27040 [0m(-0.00604)
     | > avg_loss_dur:[91m 0.75268 [0m(+0.00833)


[4m[1m > EPOCH: 815/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:30:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.50992 [0m(+0.02764)
     | > avg_log_mle:[91m -0.25397 [0m(+0.01643)
     | > avg_loss_dur:[91m 0.76390 [0m(+0.01121)


[4m[1m > EPOCH: 816/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:30:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2450[0m
     | > loss: -0.67060  (-0.48940)
     | > log_mle: -0.82285  (-0.68573)
     | > loss_dur: 0.15225  (0.19633)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 30.58021  (40.91590)
     | > current_lr: 0.00020 
     | > step_time: 0.39940  (0.71765)
     | > loader_time: 0.10010  (0.26024)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.46962 [0m(-0.04030)
     | > avg_log_mle:[92m -0.26933 [0m(-0.01536)
     | > avg_loss_dur:[92m 0.73896 [0m(-0.02494)


[4m[1m > EPOCH: 817/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:31:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.51470 [0m(+0.04508)
     | > avg_log_mle:[91m -0.24092 [0m(+0.02842)
     | > avg_loss_dur:[91m 0.75562 [0m(+0.01666)


[4m[1m > EPOCH: 818/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:31:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.43036 [0m(-0.08434)
     | > avg_log_mle:[92m -0.25331 [0m(-0.01239)
     | > avg_loss_dur:[92m 0.68367 [0m(-0.07195)


[4m[1m > EPOCH: 819/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:31:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.46072 [0m(+0.03036)
     | > avg_log_mle:[91m -0.24693 [0m(+0.00638)
     | > avg_loss_dur:[91m 0.70765 [0m(+0.02397)


[4m[1m > EPOCH: 820/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:31:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.46377 [0m(+0.00305)
     | > avg_log_mle:[92m -0.25147 [0m(-0.00455)
     | > avg_loss_dur:[91m 0.71524 [0m(+0.00759)


[4m[1m > EPOCH: 821/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:31:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.47428 [0m(+0.01052)
     | > avg_log_mle:[91m -0.24801 [0m(+0.00346)
     | > avg_loss_dur:[91m 0.72229 [0m(+0.00705)


[4m[1m > EPOCH: 822/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:31:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.48056 [0m(+0.00627)
     | > avg_log_mle:[92m -0.25505 [0m(-0.00704)
     | > avg_loss_dur:[91m 0.73560 [0m(+0.01331)


[4m[1m > EPOCH: 823/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.52007 [0m(+0.03951)
     | > avg_log_mle:[91m -0.24896 [0m(+0.00609)
     | > avg_loss_dur:[91m 0.76903 [0m(+0.03343)


[4m[1m > EPOCH: 824/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.47804 [0m(-0.04204)
     | > avg_log_mle:[91m -0.24186 [0m(+0.00711)
     | > avg_loss_dur:[92m 0.71989 [0m(-0.04914)


[4m[1m > EPOCH: 825/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2475[0m
     | > loss: -0.42434  (-0.42434)
     | > log_mle: -0.62318  (-0.62318)
     | > loss_dur: 0.19884  (0.19884)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 49.78447  (49.78447)
     | > current_lr: 0.00021 
     | > step_time: 0.86380  (0.86379)
     | > loader_time: 0.53050  (0.53048)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.44799 [0m(-0.03004)
     | > avg_log_mle:[92m -0.25556 [0m(-0.01371)
     | > avg_loss_dur:[92m 0.70355 [0m(-0.01634)


[4m[1m > EPOCH: 826/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.45802 [0m(+0.01002)
     | > avg_log_mle:[92m -0.25676 [0m(-0.00119)
     | > avg_loss_dur:[91m 0.71477 [0m(+0.01122)


[4m[1m > EPOCH: 827/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.49264 [0m(+0.03462)
     | > avg_log_mle:[91m -0.24236 [0m(+0.01439)
     | > avg_loss_dur:[91m 0.73500 [0m(+0.02023)


[4m[1m > EPOCH: 828/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.46103 [0m(-0.03161)
     | > avg_log_mle:[92m -0.25726 [0m(-0.01490)
     | > avg_loss_dur:[92m 0.71829 [0m(-0.01671)


[4m[1m > EPOCH: 829/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:32:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.58737 [0m(+0.12634)
     | > avg_log_mle:[91m -0.25515 [0m(+0.00211)
     | > avg_loss_dur:[91m 0.84252 [0m(+0.12423)


[4m[1m > EPOCH: 830/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:33:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00300)
     | > avg_loss:[92m 0.52254 [0m(-0.06483)
     | > avg_log_mle:[91m -0.21469 [0m(+0.04046)
     | > avg_loss_dur:[92m 0.73722 [0m(-0.10530)


[4m[1m > EPOCH: 831/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:33:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00300)
     | > avg_loss:[92m 0.44648 [0m(-0.07605)
     | > avg_log_mle:[92m -0.25470 [0m(-0.04001)
     | > avg_loss_dur:[92m 0.70118 [0m(-0.03604)


[4m[1m > EPOCH: 832/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:33:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.49520 [0m(+0.04871)
     | > avg_log_mle:[91m -0.22754 [0m(+0.02716)
     | > avg_loss_dur:[91m 0.72273 [0m(+0.02155)


[4m[1m > EPOCH: 833/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:33:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2500[0m
     | > loss: -0.30774  (-0.30774)
     | > log_mle: -0.54409  (-0.54409)
     | > loss_dur: 0.23635  (0.23635)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 72.20256  (72.20256)
     | > current_lr: 0.00021 
     | > step_time: 1.02990  (1.02994)
     | > loader_time: 0.41840  (0.41837)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.46578 [0m(-0.02942)
     | > avg_log_mle:[92m -0.24375 [0m(-0.01621)
     | > avg_loss_dur:[92m 0.70952 [0m(-0.01321)


[4m[1m > EPOCH: 834/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:33:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.56713 [0m(+0.10135)
     | > avg_log_mle:[91m -0.23710 [0m(+0.00664)
     | > avg_loss_dur:[91m 0.80423 [0m(+0.09471)


[4m[1m > EPOCH: 835/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:33:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.50002 [0m(-0.06711)
     | > avg_log_mle:[91m -0.23424 [0m(+0.00286)
     | > avg_loss_dur:[92m 0.73426 [0m(-0.06997)


[4m[1m > EPOCH: 836/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.56672 [0m(+0.06670)
     | > avg_log_mle:[91m -0.23089 [0m(+0.00335)
     | > avg_loss_dur:[91m 0.79761 [0m(+0.06335)


[4m[1m > EPOCH: 837/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.49210 [0m(-0.07462)
     | > avg_log_mle:[92m -0.23771 [0m(-0.00682)
     | > avg_loss_dur:[92m 0.72982 [0m(-0.06780)


[4m[1m > EPOCH: 838/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.47411 [0m(-0.01799)
     | > avg_log_mle:[91m -0.23666 [0m(+0.00105)
     | > avg_loss_dur:[92m 0.71077 [0m(-0.01904)


[4m[1m > EPOCH: 839/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.50317 [0m(+0.02906)
     | > avg_log_mle:[91m -0.22564 [0m(+0.01102)
     | > avg_loss_dur:[91m 0.72881 [0m(+0.01804)


[4m[1m > EPOCH: 840/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.57642 [0m(+0.07325)
     | > avg_log_mle:[91m -0.21029 [0m(+0.01535)
     | > avg_loss_dur:[91m 0.78671 [0m(+0.05790)


[4m[1m > EPOCH: 841/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2525[0m
     | > loss: -0.71175  (-0.51082)
     | > log_mle: -0.85296  (-0.69931)
     | > loss_dur: 0.14121  (0.18850)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 42.52645  (38.76015)
     | > current_lr: 0.00021 
     | > step_time: 0.40140  (0.72066)
     | > loader_time: 0.10310  (0.26074)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.64741 [0m(+0.07099)
     | > avg_log_mle:[92m -0.22213 [0m(-0.01184)
     | > avg_loss_dur:[91m 0.86954 [0m(+0.08283)


[4m[1m > EPOCH: 842/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:34:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.56587 [0m(-0.08154)
     | > avg_log_mle:[92m -0.25234 [0m(-0.03021)
     | > avg_loss_dur:[92m 0.81821 [0m(-0.05133)


[4m[1m > EPOCH: 843/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:35:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.55350 [0m(-0.01237)
     | > avg_log_mle:[91m -0.23503 [0m(+0.01731)
     | > avg_loss_dur:[92m 0.78854 [0m(-0.02967)


[4m[1m > EPOCH: 844/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:35:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.52397 [0m(-0.02953)
     | > avg_log_mle:[92m -0.24271 [0m(-0.00768)
     | > avg_loss_dur:[92m 0.76668 [0m(-0.02185)


[4m[1m > EPOCH: 845/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:35:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.53635 [0m(+0.01238)
     | > avg_log_mle:[91m -0.22389 [0m(+0.01882)
     | > avg_loss_dur:[92m 0.76025 [0m(-0.00644)


[4m[1m > EPOCH: 846/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:35:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[91m 0.63579 [0m(+0.09943)
     | > avg_log_mle:[92m -0.23264 [0m(-0.00875)
     | > avg_loss_dur:[91m 0.86843 [0m(+0.10818)


[4m[1m > EPOCH: 847/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:35:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.55922 [0m(-0.07657)
     | > avg_log_mle:[91m -0.22359 [0m(+0.00905)
     | > avg_loss_dur:[92m 0.78281 [0m(-0.08562)


[4m[1m > EPOCH: 848/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:35:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.52182 [0m(-0.03740)
     | > avg_log_mle:[92m -0.22640 [0m(-0.00281)
     | > avg_loss_dur:[92m 0.74822 [0m(-0.03459)


[4m[1m > EPOCH: 849/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.49973 [0m(-0.02208)
     | > avg_log_mle:[92m -0.22672 [0m(-0.00032)
     | > avg_loss_dur:[92m 0.72645 [0m(-0.02176)


[4m[1m > EPOCH: 850/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2550[0m
     | > loss: -0.47669  (-0.47669)
     | > log_mle: -0.65811  (-0.65811)
     | > loss_dur: 0.18142  (0.18142)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 41.88476  (41.88476)
     | > current_lr: 0.00021 
     | > step_time: 0.81880  (0.81876)
     | > loader_time: 0.33130  (0.33130)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.50088 [0m(+0.00115)
     | > avg_log_mle:[91m -0.22376 [0m(+0.00296)
     | > avg_loss_dur:[92m 0.72464 [0m(-0.00181)


[4m[1m > EPOCH: 851/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.51878 [0m(+0.01790)
     | > avg_log_mle:[92m -0.22489 [0m(-0.00113)
     | > avg_loss_dur:[91m 0.74368 [0m(+0.01904)


[4m[1m > EPOCH: 852/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.58560 [0m(+0.06682)
     | > avg_log_mle:[91m -0.21729 [0m(+0.00761)
     | > avg_loss_dur:[91m 0.80289 [0m(+0.05921)


[4m[1m > EPOCH: 853/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.56372 [0m(-0.02188)
     | > avg_log_mle:[91m -0.21550 [0m(+0.00178)
     | > avg_loss_dur:[92m 0.77922 [0m(-0.02367)


[4m[1m > EPOCH: 854/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.63606 [0m(+0.07234)
     | > avg_log_mle:[91m -0.20787 [0m(+0.00763)
     | > avg_loss_dur:[91m 0.84393 [0m(+0.06471)


[4m[1m > EPOCH: 855/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:36:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.58598 [0m(-0.05008)
     | > avg_log_mle:[91m -0.18581 [0m(+0.02206)
     | > avg_loss_dur:[92m 0.77180 [0m(-0.07214)


[4m[1m > EPOCH: 856/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:37:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00000)
     | > avg_loss:[92m 0.55312 [0m(-0.03286)
     | > avg_log_mle:[92m -0.22215 [0m(-0.03633)
     | > avg_loss_dur:[91m 0.77527 [0m(+0.00347)


[4m[1m > EPOCH: 857/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:37:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.65159 [0m(+0.09847)
     | > avg_log_mle:[91m -0.12345 [0m(+0.09870)
     | > avg_loss_dur:[92m 0.77504 [0m(-0.00023)


[4m[1m > EPOCH: 858/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:37:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2575[0m
     | > loss: -0.22908  (-0.22908)
     | > log_mle: -0.47253  (-0.47253)
     | > loss_dur: 0.24345  (0.24345)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 23.78535  (23.78535)
     | > current_lr: 0.00021 
     | > step_time: 1.02990  (1.02994)
     | > loader_time: 0.41640  (0.41638)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.55219 [0m(-0.09940)
     | > avg_log_mle:[92m -0.28021 [0m(-0.15676)
     | > avg_loss_dur:[91m 0.83240 [0m(+0.05736)


[4m[1m > EPOCH: 859/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:37:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.48681 [0m(-0.06538)
     | > avg_log_mle:[91m -0.24369 [0m(+0.03652)
     | > avg_loss_dur:[92m 0.73051 [0m(-0.10190)


[4m[1m > EPOCH: 860/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:37:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.49030 [0m(+0.00349)
     | > avg_log_mle:[92m -0.25750 [0m(-0.01381)
     | > avg_loss_dur:[91m 0.74780 [0m(+0.01729)


[4m[1m > EPOCH: 861/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:37:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[91m 0.62339 [0m(+0.13309)
     | > avg_log_mle:[91m -0.21026 [0m(+0.04725)
     | > avg_loss_dur:[91m 0.83365 [0m(+0.08585)


[4m[1m > EPOCH: 862/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.53015 [0m(-0.09324)
     | > avg_log_mle:[92m -0.23148 [0m(-0.02122)
     | > avg_loss_dur:[92m 0.76163 [0m(-0.07202)


[4m[1m > EPOCH: 863/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.48559 [0m(-0.04457)
     | > avg_log_mle:[92m -0.25915 [0m(-0.02767)
     | > avg_loss_dur:[92m 0.74474 [0m(-0.01690)


[4m[1m > EPOCH: 864/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.54999 [0m(+0.06440)
     | > avg_log_mle:[91m -0.20301 [0m(+0.05614)
     | > avg_loss_dur:[91m 0.75300 [0m(+0.00827)


[4m[1m > EPOCH: 865/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.62654 [0m(+0.07655)
     | > avg_log_mle:[92m -0.21179 [0m(-0.00878)
     | > avg_loss_dur:[91m 0.83833 [0m(+0.08533)


[4m[1m > EPOCH: 866/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2600[0m
     | > loss: -0.63337  (-0.44050)
     | > log_mle: -0.78171  (-0.64100)
     | > loss_dur: 0.14834  (0.20050)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 27.25292  (29.30665)
     | > current_lr: 0.00022 
     | > step_time: 0.40040  (0.71865)
     | > loader_time: 0.10310  (0.26274)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.44435 [0m(-0.18219)
     | > avg_log_mle:[92m -0.23797 [0m(-0.02618)
     | > avg_loss_dur:[92m 0.68231 [0m(-0.15602)


[4m[1m > EPOCH: 867/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.54317 [0m(+0.09883)
     | > avg_log_mle:[92m -0.24813 [0m(-0.01016)
     | > avg_loss_dur:[91m 0.79130 [0m(+0.10899)


[4m[1m > EPOCH: 868/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:38:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.47569 [0m(-0.06748)
     | > avg_log_mle:[92m -0.25253 [0m(-0.00440)
     | > avg_loss_dur:[92m 0.72822 [0m(-0.06308)


[4m[1m > EPOCH: 869/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:39:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.57175 [0m(+0.09605)
     | > avg_log_mle:[91m -0.20973 [0m(+0.04280)
     | > avg_loss_dur:[91m 0.78148 [0m(+0.05325)


[4m[1m > EPOCH: 870/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:39:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.49291 [0m(-0.07884)
     | > avg_log_mle:[91m -0.20869 [0m(+0.00104)
     | > avg_loss_dur:[92m 0.70160 [0m(-0.07988)


[4m[1m > EPOCH: 871/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:39:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.51634 [0m(+0.02343)
     | > avg_log_mle:[92m -0.21712 [0m(-0.00843)
     | > avg_loss_dur:[91m 0.73346 [0m(+0.03186)


[4m[1m > EPOCH: 872/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:39:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.60223 [0m(+0.08589)
     | > avg_log_mle:[92m -0.21973 [0m(-0.00261)
     | > avg_loss_dur:[91m 0.82196 [0m(+0.08851)


[4m[1m > EPOCH: 873/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:39:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.52752 [0m(-0.07471)
     | > avg_log_mle:[91m -0.20753 [0m(+0.01220)
     | > avg_loss_dur:[92m 0.73506 [0m(-0.08691)


[4m[1m > EPOCH: 874/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:39:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.63024 [0m(+0.10271)
     | > avg_log_mle:[92m -0.22482 [0m(-0.01728)
     | > avg_loss_dur:[91m 0.85505 [0m(+0.12000)


[4m[1m > EPOCH: 875/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2625[0m
     | > loss: -0.44753  (-0.44753)
     | > log_mle: -0.63281  (-0.63281)
     | > loss_dur: 0.18528  (0.18528)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 22.03943  (22.03943)
     | > current_lr: 0.00022 
     | > step_time: 0.72270  (0.72266)
     | > loader_time: 0.31930  (0.31929)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.63920 [0m(+0.00896)
     | > avg_log_mle:[91m -0.22400 [0m(+0.00081)
     | > avg_loss_dur:[91m 0.86320 [0m(+0.00815)


[4m[1m > EPOCH: 876/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.54353 [0m(-0.09567)
     | > avg_log_mle:[91m -0.22160 [0m(+0.00240)
     | > avg_loss_dur:[92m 0.76513 [0m(-0.09807)


[4m[1m > EPOCH: 877/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.51306 [0m(-0.03047)
     | > avg_log_mle:[91m -0.22059 [0m(+0.00101)
     | > avg_loss_dur:[92m 0.73365 [0m(-0.03148)


[4m[1m > EPOCH: 878/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.51652 [0m(+0.00346)
     | > avg_log_mle:[91m -0.20081 [0m(+0.01978)
     | > avg_loss_dur:[92m 0.71734 [0m(-0.01632)


[4m[1m > EPOCH: 879/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.58133 [0m(+0.06480)
     | > avg_log_mle:[92m -0.24842 [0m(-0.04761)
     | > avg_loss_dur:[91m 0.82975 [0m(+0.11242)


[4m[1m > EPOCH: 880/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.55342 [0m(-0.02791)
     | > avg_log_mle:[91m -0.20798 [0m(+0.04044)
     | > avg_loss_dur:[92m 0.76140 [0m(-0.06835)


[4m[1m > EPOCH: 881/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:40:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.53322 [0m(-0.02020)
     | > avg_log_mle:[91m -0.19665 [0m(+0.01133)
     | > avg_loss_dur:[92m 0.72987 [0m(-0.03153)


[4m[1m > EPOCH: 882/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:41:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.56207 [0m(+0.02886)
     | > avg_log_mle:[92m -0.21887 [0m(-0.02222)
     | > avg_loss_dur:[91m 0.78094 [0m(+0.05107)


[4m[1m > EPOCH: 883/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:41:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2650[0m
     | > loss: -0.34705  (-0.34705)
     | > log_mle: -0.56458  (-0.56458)
     | > loss_dur: 0.21752  (0.21752)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 21.13256  (21.13256)
     | > current_lr: 0.00022 
     | > step_time: 1.03690  (1.03694)
     | > loader_time: 0.42440  (0.42437)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.55366 [0m(-0.00841)
     | > avg_log_mle:[92m -0.23573 [0m(-0.01687)
     | > avg_loss_dur:[91m 0.78939 [0m(+0.00845)


[4m[1m > EPOCH: 884/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:41:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.55596 [0m(+0.00230)
     | > avg_log_mle:[91m -0.17409 [0m(+0.06165)
     | > avg_loss_dur:[92m 0.73005 [0m(-0.05934)


[4m[1m > EPOCH: 885/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:41:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.62672 [0m(+0.07076)
     | > avg_log_mle:[92m -0.18326 [0m(-0.00917)
     | > avg_loss_dur:[91m 0.80998 [0m(+0.07993)


[4m[1m > EPOCH: 886/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:41:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.56705 [0m(-0.05967)
     | > avg_log_mle:[92m -0.21781 [0m(-0.03455)
     | > avg_loss_dur:[92m 0.78486 [0m(-0.02512)


[4m[1m > EPOCH: 887/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:41:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.59892 [0m(+0.03187)
     | > avg_log_mle:[91m -0.20861 [0m(+0.00920)
     | > avg_loss_dur:[91m 0.80753 [0m(+0.02266)


[4m[1m > EPOCH: 888/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[91m 0.62215 [0m(+0.02324)
     | > avg_log_mle:[91m -0.19333 [0m(+0.01528)
     | > avg_loss_dur:[91m 0.81549 [0m(+0.00796)


[4m[1m > EPOCH: 889/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.50796 [0m(-0.11419)
     | > avg_log_mle:[92m -0.19590 [0m(-0.00256)
     | > avg_loss_dur:[92m 0.70385 [0m(-0.11163)


[4m[1m > EPOCH: 890/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.53780 [0m(+0.02985)
     | > avg_log_mle:[92m -0.22241 [0m(-0.02651)
     | > avg_loss_dur:[91m 0.76021 [0m(+0.05636)


[4m[1m > EPOCH: 891/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2675[0m
     | > loss: -0.71134  (-0.51298)
     | > log_mle: -0.81655  (-0.67428)
     | > loss_dur: 0.10521  (0.16130)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 15.69514  (18.27440)
     | > current_lr: 0.00022 
     | > step_time: 0.40440  (0.72316)
     | > loader_time: 0.10310  (0.26273)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[91m 0.63065 [0m(+0.09285)
     | > avg_log_mle:[92m -0.22382 [0m(-0.00141)
     | > avg_loss_dur:[91m 0.85447 [0m(+0.09426)


[4m[1m > EPOCH: 892/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[92m 0.56684 [0m(-0.06381)
     | > avg_log_mle:[91m -0.20698 [0m(+0.01684)
     | > avg_loss_dur:[92m 0.77382 [0m(-0.08065)


[4m[1m > EPOCH: 893/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.57166 [0m(+0.00482)
     | > avg_log_mle:[92m -0.23192 [0m(-0.02494)
     | > avg_loss_dur:[91m 0.80358 [0m(+0.02976)


[4m[1m > EPOCH: 894/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:42:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.65161 [0m(+0.07994)
     | > avg_log_mle:[91m -0.21366 [0m(+0.01826)
     | > avg_loss_dur:[91m 0.86526 [0m(+0.06168)


[4m[1m > EPOCH: 895/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:43:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.57589 [0m(-0.07572)
     | > avg_log_mle:[91m -0.19858 [0m(+0.01507)
     | > avg_loss_dur:[92m 0.77447 [0m(-0.09079)


[4m[1m > EPOCH: 896/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:43:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.56712 [0m(-0.00877)
     | > avg_log_mle:[91m -0.19145 [0m(+0.00713)
     | > avg_loss_dur:[92m 0.75857 [0m(-0.01590)


[4m[1m > EPOCH: 897/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:43:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.61040 [0m(+0.04328)
     | > avg_log_mle:[92m -0.19876 [0m(-0.00731)
     | > avg_loss_dur:[91m 0.80917 [0m(+0.05059)


[4m[1m > EPOCH: 898/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:43:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.55437 [0m(-0.05603)
     | > avg_log_mle:[92m -0.20569 [0m(-0.00693)
     | > avg_loss_dur:[92m 0.76007 [0m(-0.04910)


[4m[1m > EPOCH: 899/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:43:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.74491 [0m(+0.19054)
     | > avg_log_mle:[91m -0.18748 [0m(+0.01822)
     | > avg_loss_dur:[91m 0.93239 [0m(+0.17232)


[4m[1m > EPOCH: 900/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:43:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2700[0m
     | > loss: -0.44781  (-0.44781)
     | > log_mle: -0.62868  (-0.62868)
     | > loss_dur: 0.18086  (0.18086)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 40.68109  (40.68109)
     | > current_lr: 0.00022 
     | > step_time: 0.72070  (0.72066)
     | > loader_time: 0.31230  (0.31228)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.67692 [0m(-0.06800)
     | > avg_log_mle:[92m -0.19554 [0m(-0.00806)
     | > avg_loss_dur:[92m 0.87245 [0m(-0.05994)


[4m[1m > EPOCH: 901/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:44:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.60024 [0m(-0.07667)
     | > avg_log_mle:[92m -0.21232 [0m(-0.01678)
     | > avg_loss_dur:[92m 0.81256 [0m(-0.05989)


[4m[1m > EPOCH: 902/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:44:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.59357 [0m(-0.00668)
     | > avg_log_mle:[91m -0.21082 [0m(+0.00149)
     | > avg_loss_dur:[92m 0.80439 [0m(-0.00817)


[4m[1m > EPOCH: 903/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:44:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.65872 [0m(+0.06515)
     | > avg_log_mle:[91m -0.19018 [0m(+0.02064)
     | > avg_loss_dur:[91m 0.84890 [0m(+0.04451)


[4m[1m > EPOCH: 904/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:44:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.59305 [0m(-0.06567)
     | > avg_log_mle:[91m -0.17573 [0m(+0.01446)
     | > avg_loss_dur:[92m 0.76878 [0m(-0.08013)


[4m[1m > EPOCH: 905/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:44:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.65770 [0m(+0.06465)
     | > avg_log_mle:[92m -0.19042 [0m(-0.01469)
     | > avg_loss_dur:[91m 0.84812 [0m(+0.07934)


[4m[1m > EPOCH: 906/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:44:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.70847 [0m(+0.05078)
     | > avg_log_mle:[92m -0.19684 [0m(-0.00642)
     | > avg_loss_dur:[91m 0.90531 [0m(+0.05720)


[4m[1m > EPOCH: 907/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.62459 [0m(-0.08389)
     | > avg_log_mle:[92m -0.19704 [0m(-0.00020)
     | > avg_loss_dur:[92m 0.82163 [0m(-0.08368)


[4m[1m > EPOCH: 908/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2725[0m
     | > loss: -0.39661  (-0.39661)
     | > log_mle: -0.59762  (-0.59762)
     | > loss_dur: 0.20101  (0.20101)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 24.13079  (24.13079)
     | > current_lr: 0.00023 
     | > step_time: 1.04500  (1.04496)
     | > loader_time: 0.41640  (0.41637)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.67667 [0m(+0.05208)
     | > avg_log_mle:[91m -0.17007 [0m(+0.02698)
     | > avg_loss_dur:[91m 0.84674 [0m(+0.02511)


[4m[1m > EPOCH: 909/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.71852 [0m(+0.04184)
     | > avg_log_mle:[91m -0.15723 [0m(+0.01284)
     | > avg_loss_dur:[91m 0.87575 [0m(+0.02901)


[4m[1m > EPOCH: 910/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[92m 0.69495 [0m(-0.02356)
     | > avg_log_mle:[92m -0.17894 [0m(-0.02171)
     | > avg_loss_dur:[92m 0.87390 [0m(-0.00185)


[4m[1m > EPOCH: 911/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.68247 [0m(-0.01248)
     | > avg_log_mle:[92m -0.19985 [0m(-0.02090)
     | > avg_loss_dur:[91m 0.88232 [0m(+0.00842)


[4m[1m > EPOCH: 912/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.68300 [0m(+0.00052)
     | > avg_log_mle:[91m -0.18030 [0m(+0.01955)
     | > avg_loss_dur:[92m 0.86330 [0m(-0.01902)


[4m[1m > EPOCH: 913/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:45:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.60677 [0m(-0.07623)
     | > avg_log_mle:[91m -0.17238 [0m(+0.00792)
     | > avg_loss_dur:[92m 0.77915 [0m(-0.08415)


[4m[1m > EPOCH: 914/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:46:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.62549 [0m(+0.01873)
     | > avg_log_mle:[91m -0.16496 [0m(+0.00742)
     | > avg_loss_dur:[91m 0.79045 [0m(+0.01130)


[4m[1m > EPOCH: 915/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:46:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.72583 [0m(+0.10034)
     | > avg_log_mle:[92m -0.17237 [0m(-0.00741)
     | > avg_loss_dur:[91m 0.89820 [0m(+0.10775)


[4m[1m > EPOCH: 916/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:46:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2750[0m
     | > loss: -0.88015  (-0.64529)
     | > log_mle: -0.95557  (-0.77752)
     | > loss_dur: 0.07542  (0.13223)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 49.69785  (34.17176)
     | > current_lr: 0.00023 
     | > step_time: 0.40140  (0.72066)
     | > loader_time: 0.10410  (0.26122)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.70722 [0m(-0.01861)
     | > avg_log_mle:[91m -0.15975 [0m(+0.01262)
     | > avg_loss_dur:[92m 0.86697 [0m(-0.03123)


[4m[1m > EPOCH: 917/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:46:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.69092 [0m(-0.01630)
     | > avg_log_mle:[92m -0.17037 [0m(-0.01063)
     | > avg_loss_dur:[92m 0.86129 [0m(-0.00568)


[4m[1m > EPOCH: 918/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:46:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.67569 [0m(-0.01522)
     | > avg_log_mle:[91m -0.15884 [0m(+0.01154)
     | > avg_loss_dur:[92m 0.83453 [0m(-0.02676)


[4m[1m > EPOCH: 919/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:46:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.74088 [0m(+0.06519)
     | > avg_log_mle:[92m -0.17867 [0m(-0.01984)
     | > avg_loss_dur:[91m 0.91955 [0m(+0.08503)


[4m[1m > EPOCH: 920/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.73453 [0m(-0.00635)
     | > avg_log_mle:[91m -0.17222 [0m(+0.00645)
     | > avg_loss_dur:[92m 0.90675 [0m(-0.01280)


[4m[1m > EPOCH: 921/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.69356 [0m(-0.04097)
     | > avg_log_mle:[91m -0.17192 [0m(+0.00030)
     | > avg_loss_dur:[92m 0.86549 [0m(-0.04126)


[4m[1m > EPOCH: 922/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.74018 [0m(+0.04662)
     | > avg_log_mle:[91m -0.15342 [0m(+0.01850)
     | > avg_loss_dur:[91m 0.89360 [0m(+0.02811)


[4m[1m > EPOCH: 923/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.75845 [0m(+0.01827)
     | > avg_log_mle:[92m -0.17038 [0m(-0.01696)
     | > avg_loss_dur:[91m 0.92883 [0m(+0.03522)


[4m[1m > EPOCH: 924/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.75268 [0m(-0.00577)
     | > avg_log_mle:[91m -0.15571 [0m(+0.01467)
     | > avg_loss_dur:[92m 0.90839 [0m(-0.02044)


[4m[1m > EPOCH: 925/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2775[0m
     | > loss: -0.56446  (-0.56446)
     | > log_mle: -0.71023  (-0.71023)
     | > loss_dur: 0.14577  (0.14577)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 28.77640  (28.77640)
     | > current_lr: 0.00023 
     | > step_time: 0.73170  (0.73166)
     | > loader_time: 0.32830  (0.32829)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.78186 [0m(+0.02918)
     | > avg_log_mle:[91m -0.14237 [0m(+0.01334)
     | > avg_loss_dur:[91m 0.92423 [0m(+0.01584)


[4m[1m > EPOCH: 926/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:47:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.72926 [0m(-0.05260)
     | > avg_log_mle:[92m -0.16185 [0m(-0.01949)
     | > avg_loss_dur:[92m 0.89112 [0m(-0.03311)


[4m[1m > EPOCH: 927/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:48:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.68281 [0m(-0.04645)
     | > avg_log_mle:[91m -0.13396 [0m(+0.02790)
     | > avg_loss_dur:[92m 0.81677 [0m(-0.07434)


[4m[1m > EPOCH: 928/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:48:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.75122 [0m(+0.06840)
     | > avg_log_mle:[92m -0.16256 [0m(-0.02861)
     | > avg_loss_dur:[91m 0.91378 [0m(+0.09701)


[4m[1m > EPOCH: 929/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:48:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.66516 [0m(-0.08605)
     | > avg_log_mle:[91m -0.13005 [0m(+0.03251)
     | > avg_loss_dur:[92m 0.79522 [0m(-0.11856)


[4m[1m > EPOCH: 930/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:48:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.73736 [0m(+0.07219)
     | > avg_log_mle:[92m -0.16444 [0m(-0.03438)
     | > avg_loss_dur:[91m 0.90179 [0m(+0.10658)


[4m[1m > EPOCH: 931/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:48:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.72754 [0m(-0.00982)
     | > avg_log_mle:[91m -0.13935 [0m(+0.02509)
     | > avg_loss_dur:[92m 0.86688 [0m(-0.03491)


[4m[1m > EPOCH: 932/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:48:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.77227 [0m(+0.04474)
     | > avg_log_mle:[92m -0.15001 [0m(-0.01067)
     | > avg_loss_dur:[91m 0.92229 [0m(+0.05540)


[4m[1m > EPOCH: 933/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:49:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2800[0m
     | > loss: -0.44421  (-0.44421)
     | > log_mle: -0.62554  (-0.62554)
     | > loss_dur: 0.18133  (0.18133)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 41.27505  (41.27505)
     | > current_lr: 0.00023 
     | > step_time: 1.04090  (1.04095)
     | > loader_time: 0.43840  (0.43840)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.77075 [0m(-0.00152)
     | > avg_log_mle:[91m -0.13690 [0m(+0.01311)
     | > avg_loss_dur:[92m 0.90765 [0m(-0.01464)


[4m[1m > EPOCH: 934/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:49:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.01001 [0m(-0.00000)
     | > avg_loss:[92m 0.72110 [0m(-0.04966)
     | > avg_log_mle:[92m -0.14192 [0m(-0.00503)
     | > avg_loss_dur:[92m 0.86302 [0m(-0.04463)


[4m[1m > EPOCH: 935/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:49:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.79015 [0m(+0.06905)
     | > avg_log_mle:[91m -0.12513 [0m(+0.01679)
     | > avg_loss_dur:[91m 0.91528 [0m(+0.05226)


[4m[1m > EPOCH: 936/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:49:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.81132 [0m(+0.02118)
     | > avg_log_mle:[92m -0.13911 [0m(-0.01398)
     | > avg_loss_dur:[91m 0.95043 [0m(+0.03516)


[4m[1m > EPOCH: 937/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:49:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00000)
     | > avg_loss:[91m 0.82706 [0m(+0.01574)
     | > avg_log_mle:[91m -0.11587 [0m(+0.02324)
     | > avg_loss_dur:[92m 0.94293 [0m(-0.00750)


[4m[1m > EPOCH: 938/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:49:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01101 [0m(+0.00300)
     | > avg_loss:[92m 0.81697 [0m(-0.01009)
     | > avg_log_mle:[92m -0.12262 [0m(-0.00675)
     | > avg_loss_dur:[92m 0.93959 [0m(-0.00335)


[4m[1m > EPOCH: 939/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00200)
     | > avg_loss:[91m 0.82567 [0m(+0.00870)
     | > avg_log_mle:[92m -0.12435 [0m(-0.00173)
     | > avg_loss_dur:[91m 0.95002 [0m(+0.01043)


[4m[1m > EPOCH: 940/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.78858 [0m(-0.03708)
     | > avg_log_mle:[91m -0.12059 [0m(+0.00376)
     | > avg_loss_dur:[92m 0.90917 [0m(-0.04085)


[4m[1m > EPOCH: 941/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2825[0m
     | > loss: -0.92002  (-0.68741)
     | > log_mle: -0.98659  (-0.80706)
     | > loss_dur: 0.06657  (0.11965)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 30.47823  (25.27326)
     | > current_lr: 0.00024 
     | > step_time: 0.40440  (0.72262)
     | > loader_time: 0.10510  (0.26124)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.79043 [0m(+0.00184)
     | > avg_log_mle:[91m -0.11897 [0m(+0.00162)
     | > avg_loss_dur:[91m 0.90939 [0m(+0.00022)


[4m[1m > EPOCH: 942/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.79434 [0m(+0.00392)
     | > avg_log_mle:[92m -0.13895 [0m(-0.01998)
     | > avg_loss_dur:[91m 0.93329 [0m(+0.02390)


[4m[1m > EPOCH: 943/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.82532 [0m(+0.03098)
     | > avg_log_mle:[91m -0.12940 [0m(+0.00955)
     | > avg_loss_dur:[91m 0.95472 [0m(+0.02143)


[4m[1m > EPOCH: 944/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.76391 [0m(-0.06141)
     | > avg_log_mle:[92m -0.15208 [0m(-0.02268)
     | > avg_loss_dur:[92m 0.91599 [0m(-0.03873)


[4m[1m > EPOCH: 945/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:50:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.74156 [0m(-0.02235)
     | > avg_log_mle:[92m -0.16158 [0m(-0.00950)
     | > avg_loss_dur:[92m 0.90313 [0m(-0.01286)


[4m[1m > EPOCH: 946/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:51:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.75921 [0m(+0.01766)
     | > avg_log_mle:[91m -0.06187 [0m(+0.09970)
     | > avg_loss_dur:[92m 0.82108 [0m(-0.08205)


[4m[1m > EPOCH: 947/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:51:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.76463 [0m(+0.00542)
     | > avg_log_mle:[92m -0.16594 [0m(-0.10407)
     | > avg_loss_dur:[91m 0.93057 [0m(+0.10949)


[4m[1m > EPOCH: 948/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:51:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.96189 [0m(+0.19726)
     | > avg_log_mle:[91m 0.03936 [0m(+0.20531)
     | > avg_loss_dur:[92m 0.92252 [0m(-0.00805)


[4m[1m > EPOCH: 949/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:51:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.64810 [0m(-0.31379)
     | > avg_log_mle:[92m -0.19351 [0m(-0.23287)
     | > avg_loss_dur:[92m 0.84161 [0m(-0.08092)


[4m[1m > EPOCH: 950/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:51:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2850[0m
     | > loss: -0.52998  (-0.52998)
     | > log_mle: -0.66910  (-0.66910)
     | > loss_dur: 0.13912  (0.13912)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 15.61799  (15.61799)
     | > current_lr: 0.00024 
     | > step_time: 0.73570  (0.73567)
     | > loader_time: 0.31730  (0.31728)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01201 [0m(+0.00300)
     | > avg_loss:[91m 0.76257 [0m(+0.11446)
     | > avg_log_mle:[91m -0.12704 [0m(+0.06647)
     | > avg_loss_dur:[91m 0.88961 [0m(+0.04800)


[4m[1m > EPOCH: 951/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:51:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00401)
     | > avg_loss:[91m 1.03674 [0m(+0.27418)
     | > avg_log_mle:[91m -0.05861 [0m(+0.06843)
     | > avg_loss_dur:[91m 1.09535 [0m(+0.20575)


[4m[1m > EPOCH: 952/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:52:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.69241 [0m(-0.34433)
     | > avg_log_mle:[92m -0.18825 [0m(-0.12964)
     | > avg_loss_dur:[92m 0.88066 [0m(-0.21470)


[4m[1m > EPOCH: 953/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:52:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.95837 [0m(+0.26596)
     | > avg_log_mle:[91m -0.15071 [0m(+0.03754)
     | > avg_loss_dur:[91m 1.10908 [0m(+0.22842)


[4m[1m > EPOCH: 954/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:52:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.67861 [0m(-0.27977)
     | > avg_log_mle:[92m -0.18078 [0m(-0.03008)
     | > avg_loss_dur:[92m 0.85939 [0m(-0.24969)


[4m[1m > EPOCH: 955/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:52:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.76906 [0m(+0.09045)
     | > avg_log_mle:[91m -0.12077 [0m(+0.06002)
     | > avg_loss_dur:[91m 0.88983 [0m(+0.03044)


[4m[1m > EPOCH: 956/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:52:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.56727 [0m(-0.20179)
     | > avg_log_mle:[92m -0.17722 [0m(-0.05646)
     | > avg_loss_dur:[92m 0.74449 [0m(-0.14534)


[4m[1m > EPOCH: 957/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:52:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[91m 0.74137 [0m(+0.17410)
     | > avg_log_mle:[92m -0.23590 [0m(-0.05868)
     | > avg_loss_dur:[91m 0.97728 [0m(+0.23279)


[4m[1m > EPOCH: 958/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:53:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2875[0m
     | > loss: -0.28906  (-0.28906)
     | > log_mle: -0.51980  (-0.51980)
     | > loss_dur: 0.23074  (0.23074)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 24.89619  (24.89619)
     | > current_lr: 0.00024 
     | > step_time: 1.03290  (1.03294)
     | > loader_time: 0.41840  (0.41838)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.71883 [0m(-0.02254)
     | > avg_log_mle:[91m -0.17666 [0m(+0.05925)
     | > avg_loss_dur:[92m 0.89549 [0m(-0.08179)


[4m[1m > EPOCH: 959/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:53:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.51349 [0m(-0.20534)
     | > avg_log_mle:[92m -0.20412 [0m(-0.02747)
     | > avg_loss_dur:[92m 0.71762 [0m(-0.17788)


[4m[1m > EPOCH: 960/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:53:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.60438 [0m(+0.09089)
     | > avg_log_mle:[91m -0.19279 [0m(+0.01134)
     | > avg_loss_dur:[91m 0.79717 [0m(+0.07955)


[4m[1m > EPOCH: 961/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:53:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.85213 [0m(+0.24775)
     | > avg_log_mle:[92m -0.22944 [0m(-0.03665)
     | > avg_loss_dur:[91m 1.08157 [0m(+0.28440)


[4m[1m > EPOCH: 962/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:53:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.92180 [0m(+0.06967)
     | > avg_log_mle:[91m -0.20966 [0m(+0.01978)
     | > avg_loss_dur:[91m 1.13146 [0m(+0.04990)


[4m[1m > EPOCH: 963/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:53:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.60030 [0m(-0.32150)
     | > avg_log_mle:[92m -0.22440 [0m(-0.01475)
     | > avg_loss_dur:[92m 0.82470 [0m(-0.30676)


[4m[1m > EPOCH: 964/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.51644 [0m(-0.08386)
     | > avg_log_mle:[91m -0.18008 [0m(+0.04433)
     | > avg_loss_dur:[92m 0.69652 [0m(-0.12819)


[4m[1m > EPOCH: 965/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.62425 [0m(+0.10781)
     | > avg_log_mle:[92m -0.19630 [0m(-0.01622)
     | > avg_loss_dur:[91m 0.82055 [0m(+0.12404)


[4m[1m > EPOCH: 966/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2900[0m
     | > loss: -0.78893  (-0.56226)
     | > log_mle: -0.90877  (-0.74393)
     | > loss_dur: 0.11984  (0.18166)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 49.96672  (31.23040)
     | > current_lr: 0.00024 
     | > step_time: 0.40540  (0.72016)
     | > loader_time: 0.10210  (0.26973)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.67639 [0m(+0.05214)
     | > avg_log_mle:[92m -0.20255 [0m(-0.00625)
     | > avg_loss_dur:[91m 0.87894 [0m(+0.05839)


[4m[1m > EPOCH: 967/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.55899 [0m(-0.11740)
     | > avg_log_mle:[91m -0.17107 [0m(+0.03148)
     | > avg_loss_dur:[92m 0.73006 [0m(-0.14888)


[4m[1m > EPOCH: 968/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[92m 0.54776 [0m(-0.01123)
     | > avg_log_mle:[92m -0.19994 [0m(-0.02887)
     | > avg_loss_dur:[91m 0.74770 [0m(+0.01764)


[4m[1m > EPOCH: 969/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.72778 [0m(+0.18002)
     | > avg_log_mle:[91m -0.18265 [0m(+0.01729)
     | > avg_loss_dur:[91m 0.91043 [0m(+0.16273)


[4m[1m > EPOCH: 970/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:54:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.78669 [0m(+0.05891)
     | > avg_log_mle:[91m -0.17292 [0m(+0.00973)
     | > avg_loss_dur:[91m 0.95961 [0m(+0.04918)


[4m[1m > EPOCH: 971/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:55:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.76298 [0m(-0.02371)
     | > avg_log_mle:[91m -0.16172 [0m(+0.01120)
     | > avg_loss_dur:[92m 0.92471 [0m(-0.03490)


[4m[1m > EPOCH: 972/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:55:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[92m 0.73397 [0m(-0.02901)
     | > avg_log_mle:[91m -0.14856 [0m(+0.01316)
     | > avg_loss_dur:[92m 0.88254 [0m(-0.04217)


[4m[1m > EPOCH: 973/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:55:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00000)
     | > avg_loss:[91m 0.74989 [0m(+0.01592)
     | > avg_log_mle:[91m -0.14323 [0m(+0.00534)
     | > avg_loss_dur:[91m 0.89312 [0m(+0.01058)


[4m[1m > EPOCH: 974/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:55:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.74681 [0m(-0.00308)
     | > avg_log_mle:[92m -0.14655 [0m(-0.00332)
     | > avg_loss_dur:[91m 0.89336 [0m(+0.00024)


[4m[1m > EPOCH: 975/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:55:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/3 -- GLOBAL_STEP: 2925[0m
     | > loss: -0.56705  (-0.56705)
     | > log_mle: -0.72658  (-0.72658)
     | > loss_dur: 0.15953  (0.15953)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 46.58623  (46.58623)
     | > current_lr: 0.00024 
     | > step_time: 0.72370  (0.72366)
     | > loader_time: 0.31730  (0.31729)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.82960 [0m(+0.08278)
     | > avg_log_mle:[92m -0.14953 [0m(-0.00299)
     | > avg_loss_dur:[91m 0.97913 [0m(+0.08577)


[4m[1m > EPOCH: 976/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:55:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.87925 [0m(+0.04965)
     | > avg_log_mle:[91m -0.12232 [0m(+0.02722)
     | > avg_loss_dur:[91m 1.00157 [0m(+0.02244)


[4m[1m > EPOCH: 977/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.81015 [0m(-0.06910)
     | > avg_log_mle:[92m -0.13709 [0m(-0.01478)
     | > avg_loss_dur:[92m 0.94724 [0m(-0.05433)


[4m[1m > EPOCH: 978/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.87290 [0m(+0.06275)
     | > avg_log_mle:[91m -0.11858 [0m(+0.01851)
     | > avg_loss_dur:[91m 0.99148 [0m(+0.04424)


[4m[1m > EPOCH: 979/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[92m 0.85744 [0m(-0.01545)
     | > avg_log_mle:[92m -0.12045 [0m(-0.00187)
     | > avg_loss_dur:[92m 0.97789 [0m(-0.01358)


[4m[1m > EPOCH: 980/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[91m 0.87465 [0m(+0.01721)
     | > avg_log_mle:[92m -0.12829 [0m(-0.00784)
     | > avg_loss_dur:[91m 1.00294 [0m(+0.02505)


[4m[1m > EPOCH: 981/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.88521 [0m(+0.01056)
     | > avg_log_mle:[91m -0.10128 [0m(+0.02702)
     | > avg_loss_dur:[92m 0.98649 [0m(-0.01646)


[4m[1m > EPOCH: 982/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.83121 [0m(-0.05400)
     | > avg_log_mle:[92m -0.11820 [0m(-0.01692)
     | > avg_loss_dur:[92m 0.94940 [0m(-0.03708)


[4m[1m > EPOCH: 983/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:56:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/3 -- GLOBAL_STEP: 2950[0m
     | > loss: -0.46203  (-0.46203)
     | > log_mle: -0.64309  (-0.64309)
     | > loss_dur: 0.18107  (0.18107)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 39.93357  (39.93357)
     | > current_lr: 0.00025 
     | > step_time: 1.03800  (1.03796)
     | > loader_time: 0.42040  (0.42038)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.85066 [0m(+0.01945)
     | > avg_log_mle:[91m -0.08900 [0m(+0.02920)
     | > avg_loss_dur:[92m 0.93966 [0m(-0.00975)


[4m[1m > EPOCH: 984/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:57:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.82159 [0m(-0.02906)
     | > avg_log_mle:[92m -0.13492 [0m(-0.04592)
     | > avg_loss_dur:[91m 0.95651 [0m(+0.01686)


[4m[1m > EPOCH: 985/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:57:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.86755 [0m(+0.04596)
     | > avg_log_mle:[91m -0.11033 [0m(+0.02458)
     | > avg_loss_dur:[91m 0.97789 [0m(+0.02138)


[4m[1m > EPOCH: 986/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:57:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.89401 [0m(+0.02646)
     | > avg_log_mle:[91m -0.06380 [0m(+0.04653)
     | > avg_loss_dur:[92m 0.95782 [0m(-0.02007)


[4m[1m > EPOCH: 987/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:57:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.86045 [0m(-0.03357)
     | > avg_log_mle:[92m -0.10554 [0m(-0.04174)
     | > avg_loss_dur:[91m 0.96599 [0m(+0.00817)


[4m[1m > EPOCH: 988/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:57:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[91m 0.86188 [0m(+0.00143)
     | > avg_log_mle:[92m -0.10763 [0m(-0.00209)
     | > avg_loss_dur:[91m 0.96951 [0m(+0.00352)


[4m[1m > EPOCH: 989/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:57:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00100)
     | > avg_loss:[91m 0.89102 [0m(+0.02915)
     | > avg_log_mle:[91m -0.07650 [0m(+0.03114)
     | > avg_loss_dur:[92m 0.96752 [0m(-0.00199)


[4m[1m > EPOCH: 990/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:58:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00901 [0m(-0.00100)
     | > avg_loss:[92m 0.86764 [0m(-0.02338)
     | > avg_log_mle:[92m -0.09385 [0m(-0.01735)
     | > avg_loss_dur:[92m 0.96149 [0m(-0.00604)


[4m[1m > EPOCH: 991/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:58:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/3 -- GLOBAL_STEP: 2975[0m
     | > loss: -0.95114  (-0.71691)
     | > log_mle: -1.01152  (-0.83384)
     | > loss_dur: 0.06038  (0.11693)
     | > amp_scaler: 4096.00000  (4096.00000)
     | > grad_norm: 238.43488  (125.30862)
     | > current_lr: 0.00025 
     | > step_time: 0.40140  (0.72066)
     | > loader_time: 0.10310  (0.25773)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.86536 [0m(-0.00228)
     | > avg_log_mle:[91m -0.02099 [0m(+0.07286)
     | > avg_loss_dur:[92m 0.88635 [0m(-0.07514)


[4m[1m > EPOCH: 992/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:58:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.83251 [0m(-0.03285)
     | > avg_log_mle:[92m -0.11767 [0m(-0.09668)
     | > avg_loss_dur:[91m 0.95018 [0m(+0.06384)


[4m[1m > EPOCH: 993/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:58:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.82886 [0m(-0.00365)
     | > avg_log_mle:[92m -0.12907 [0m(-0.01139)
     | > avg_loss_dur:[91m 0.95793 [0m(+0.00775)


[4m[1m > EPOCH: 994/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:58:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00801 [0m(+0.00000)
     | > avg_loss:[92m 0.78569 [0m(-0.04318)
     | > avg_log_mle:[91m -0.08536 [0m(+0.04371)
     | > avg_loss_dur:[92m 0.87105 [0m(-0.08689)


[4m[1m > EPOCH: 995/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:58:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00100)
     | > avg_loss:[91m 0.95340 [0m(+0.16771)
     | > avg_log_mle:[92m -0.08684 [0m(-0.00148)
     | > avg_loss_dur:[91m 1.04024 [0m(+0.16919)


[4m[1m > EPOCH: 996/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:59:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.00901 [0m(+0.00000)
     | > avg_loss:[92m 0.92910 [0m(-0.02430)
     | > avg_log_mle:[92m -0.09164 [0m(-0.00480)
     | > avg_loss_dur:[92m 1.02073 [0m(-0.01950)


[4m[1m > EPOCH: 997/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:59:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00100)
     | > avg_loss:[92m 0.91590 [0m(-0.01320)
     | > avg_log_mle:[91m -0.08969 [0m(+0.00195)
     | > avg_loss_dur:[92m 1.00558 [0m(-0.01515)


[4m[1m > EPOCH: 998/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:59:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.01001 [0m(+0.00200)
     | > avg_loss:[92m 0.86768 [0m(-0.04822)
     | > avg_log_mle:[92m -0.10486 [0m(-0.01517)
     | > avg_loss_dur:[92m 0.97254 [0m(-0.03305)


[4m[1m > EPOCH: 999/1000[0m
 --> D:\data\TIMIT\run-September-09-2022_04+29AM-75f2436

[1m > TRAINING (2022-09-09 06:59:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 139
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 22
 | > Avg text length: 49.46762589928058
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 27302.0
 | > Avg audio length: 67225.14388489208
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
	| > 1 not found characters:
	| > ͡
| > Number of instances : 1
 | > Preprocessing samples
 | > Max text length: 38
 | > Min text length: 38
 | > Avg text length: 38.0
 | 
 | > Max audio length: 50020.0
 | > Min audio length: 50020.0
 | > Avg audio length: 50020.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.00801 [0m(-0.00200)
     | > avg_loss:[92m 0.84405 [0m(-0.02363)
     | > avg_log_mle:[91m -0.08234 [0m(+0.02252)
     | > avg_loss_dur:[92m 0.92639 [0m(-0.04615)

