In [1]:
import os

from trainer import Trainer, TrainerArgs

from TTS.config.shared_configs import BaseAudioConfig
from TTS.tts.configs.glow_tts_config import GlowTTSConfig
from TTS.tts.configs.shared_configs import BaseDatasetConfig
from TTS.tts.datasets import load_tts_samples
from TTS.tts.models.glow_tts import GlowTTS
from TTS.tts.utils.speakers import SpeakerManager
from TTS.tts.utils.text.tokenizer import TTSTokenizer
from TTS.utils.audio import AudioProcessor



In [2]:
# Root directory of the TIMIT training split.
# Written as a raw string so the Windows backslashes are taken literally;
# in a normal literal "\d" and "\T" are invalid escape sequences, which
# Python reports with a warning and plans to reject.
dataset_path = r'D:\data\TIMIT\TRAIN'
# Directory handed to the model config and the trainer as their output location;
# the phoneme cache is also placed underneath it.
output_path = './output'

In [3]:
# Dataset configuration.
# The "vctk_old" format is needed when the corpus provides wav files instead of flac.
dataset_config = BaseDatasetConfig(
    name="vctk_old",
    path=dataset_path,
    meta_file_train="",
    language="en-us",
)

In [4]:
# Audio settings; these are what the AudioProcessor is later built from.
audio_config = BaseAudioConfig(
    # sampling
    sample_rate=22050,
    resample=True,
    # spectrogram shaping
    preemphasis=0.98,
    power=1.2,
    ref_level_db=2,
    # silence trimming is switched off
    # NOTE(review): trim_db presumably only matters when do_trim_silence is True — confirm
    do_trim_silence=False,
    trim_db=23.0,
)

In [5]:
# Model / training configuration for GlowTTS.
#
# `audio=audio_config` is passed explicitly: the AudioProcessor in this notebook
# is built from `audio_config`, so without it the model config would keep its
# default audio settings instead of the ones actually used for feature extraction.
# NOTE(review): presumably the config saved with the run is what inference tooling
# reads its audio settings from — confirm against the installed TTS version.
config = GlowTTSConfig(
    # --- audio ---
    audio=audio_config,
    # --- data ---
    datasets=[dataset_config],
    min_text_len=0,
    max_text_len=500,
    min_audio_len=0,
    max_audio_len=500000,
    # --- batching / loading (all worker counts are 0) ---
    batch_size=64,
    eval_batch_size=16,
    num_loader_workers=0,
    num_eval_loader_workers=0,
    precompute_num_workers=0,
    # --- text processing: phoneme-based input ---
    text_cleaner="phoneme_cleaners",
    use_phonemes=True,
    phoneme_language="en-us",
    phoneme_cache_path=os.path.join(output_path, "phoneme_cache"),
    # --- multi-speaker ---
    use_speaker_embedding=True,
    # --- training schedule ---
    epochs=1000,
    run_eval=True,
    test_delay_epochs=-1,
    mixed_precision=True,
    # --- logging / output ---
    print_step=25,
    print_eval=False,
    output_path=output_path,
)

In [6]:
# Initialize the audio processor from the audio config defined above.
# The audio processor is used for feature extraction and audio I/O.
# It mainly serves the dataloader and the training loggers.
ap = AudioProcessor.init_from_config(audio_config)

 > Setting up Audio Processor...
 | > sample_rate:22050
 | > resample:True
 | > num_mels:80
 | > log_func:np.log10
 | > min_level_db:-100
 | > frame_shift_ms:None
 | > frame_length_ms:None
 | > ref_level_db:2
 | > fft_size:1024
 | > power:1.2
 | > preemphasis:0.98
 | > griffin_lim_iters:60
 | > signal_norm:True
 | > symmetric_norm:True
 | > mel_fmin:0
 | > mel_fmax:None
 | > pitch_fmin:0.0
 | > pitch_fmax:640.0
 | > spec_gain:20.0
 | > stft_pad_mode:reflect
 | > max_norm:4.0
 | > clip_norm:True
 | > do_trim_silence:False
 | > trim_db:23.0
 | > do_sound_norm:False
 | > do_amp_to_db_linear:True
 | > do_amp_to_db_mel:True
 | > do_rms_norm:False
 | > db_level:None
 | > stats_path:None
 | > base:10
 | > hop_length:256
 | > win_length:1024


In [7]:
# Initialize the tokenizer, which converts text into sequences of token IDs.
# If characters are not defined in the config, default characters are passed to the config;
# the call returns a config alongside the tokenizer, and `config` is rebound to it here.
tokenizer, config = TTSTokenizer.init_from_config(config)

In [8]:
# Load the dataset samples and split them into training and evaluation sets.
# NOTE(review): each sample presumably carries the text, the audio file path and
# the speaker name (the speaker manager cell reads a "speaker_name" key) —
# confirm the exact sample structure for the installed TTS version.

train_samples, eval_samples = load_tts_samples(
    dataset_config,
    eval_split=True,
    eval_split_size=config.eval_split_size,
    eval_split_max_size=config.eval_split_max_size,
)

 | > Found 1140 files in D:\data\TIMIT\TRAIN


In [9]:
# Set up the speaker manager for multi-speaker training.

speaker_manager = SpeakerManager()
# Register speaker IDs from the training and evaluation samples combined,
# reading the "speaker_name" entry of each sample.
speaker_manager.set_ids_from_data(train_samples + eval_samples, parse_key="speaker_name")
# Store the resulting speaker count on the model config (mutates `config` in place).
config.num_speakers = speaker_manager.num_speakers

In [10]:
# Build the GlowTTS model from the model config, the audio processor,
# the tokenizer and the speaker manager created in the cells above.
model = GlowTTS(config, ap, tokenizer, speaker_manager=speaker_manager)

 > Init speaker_embedding layer.


In [11]:
# Set up the trainer with default TrainerArgs, the model config, the output
# directory, the model and both sample splits.

trainer = Trainer(
    TrainerArgs(),
    config,
    output_path,
    model=model,
    train_samples=train_samples,
    eval_samples=eval_samples,
)

 > Using CUDA: True
 > Number of GPUs: 1

 > Model has 32355409 parameters


 > `speakers.pth` is saved to ./output\run-September-15-2022_04+45AM-910d77a\speakers.pth.
 > `speakers_file` is updated in the config.json.


In [12]:
# Start training. The config above requests 1000 epochs with evaluation enabled
# (run_eval=True), so this cell is long-running and prints a log block per epoch.
trainer.fit()


[4m[1m > EPOCH: 0/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:45:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 0[0m
     | > current_lr: 0.00000 
     | > step_time: 1.26110  (1.26107)
     | > loader_time: 0.29230  (0.29226)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07407 [0m(+0.00000)
     | > avg_loss: 3.29431 [0m(+0.00000)
     | > avg_log_mle: 0.54783 [0m(+0.00000)
     | > avg_loss_dur: 2.74648 [0m(+0.00000)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_18.pth

[4m[1m > EPOCH: 1/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:46:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 25[0m
     | > loss: 3.45478  (3.33000)
     | > log_mle: 0.57556  (0.57569)
     | > loss_dur: 2.87923  (2.75430)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.61162  (8.33781)
     | > current_lr: 0.00000 
     | > step_time: 0.82470  (0.86414)
     | > loader_time: 0.41540  (0.43254)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.01101)
     | > avg_loss:[92m 3.29323 [0m(-0.00108)
     | > avg_log_mle:[92m 0.54779 [0m(-0.00004)
     | > avg_loss_dur:[92m 2.74543 [0m(-0.00104)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_36.pth

[4m[1m > EPOCH: 2/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:46:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 50[0m
     | > loss: 3.53581  (3.40566)
     | > log_mle: 0.58076  (0.57516)
     | > loss_dur: 2.95505  (2.83050)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.62311  (8.46199)
     | > current_lr: 0.00000 
     | > step_time: 1.02490  (0.74704)
     | > loader_time: 0.63160  (0.48079)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01501)
     | > avg_loss:[92m 3.28956 [0m(-0.00367)
     | > avg_log_mle:[92m 0.54767 [0m(-0.00012)
     | > avg_loss_dur:[92m 2.74189 [0m(-0.00355)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_54.pth

[4m[1m > EPOCH: 3/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:46:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00600)
     | > avg_loss:[92m 3.28446 [0m(-0.00510)
     | > avg_log_mle:[92m 0.54744 [0m(-0.00023)
     | > avg_loss_dur:[92m 2.73702 [0m(-0.00487)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_72.pth

[4m[1m > EPOCH: 4/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:47:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 75[0m
     | > loss: 3.22399  (3.27517)
     | > log_mle: 0.57283  (0.56267)
     | > loss_dur: 2.65116  (2.71251)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.16451  (8.25551)
     | > current_lr: 0.00000 
     | > step_time: 0.69260  (0.63958)
     | > loader_time: 0.44940  (0.43439)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00300)
     | > avg_loss:[92m 3.27354 [0m(-0.01092)
     | > avg_log_mle:[92m 0.54707 [0m(-0.00037)
     | > avg_loss_dur:[92m 2.72647 [0m(-0.01055)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_90.pth

[4m[1m > EPOCH: 5/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:47:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 100[0m
     | > loss: 3.42718  (3.33696)
     | > log_mle: 0.56234  (0.57306)
     | > loss_dur: 2.86483  (2.76390)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.41311  (8.26407)
     | > current_lr: 0.00000 
     | > step_time: 0.70960  (0.70044)
     | > loader_time: 0.45740  (0.42909)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00400)
     | > avg_loss:[92m 3.25895 [0m(-0.01459)
     | > avg_log_mle:[92m 0.54656 [0m(-0.00052)
     | > avg_loss_dur:[92m 2.71240 [0m(-0.01407)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_108.pth

[4m[1m > EPOCH: 6/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:48:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 125[0m
     | > loss: 3.58510  (3.39012)
     | > log_mle: 0.57949  (0.57420)
     | > loss_dur: 3.00561  (2.81592)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.62725  (8.30393)
     | > current_lr: 0.00000 
     | > step_time: 0.85480  (0.77741)
     | > loader_time: 0.41640  (0.49192)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00400)
     | > avg_loss:[92m 3.24268 [0m(-0.01627)
     | > avg_log_mle:[92m 0.54587 [0m(-0.00069)
     | > avg_loss_dur:[92m 2.69681 [0m(-0.01559)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_126.pth

[4m[1m > EPOCH: 7/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:48:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00400)
     | > avg_loss:[92m 3.20598 [0m(-0.03670)
     | > avg_log_mle:[92m 0.54498 [0m(-0.00089)
     | > avg_loss_dur:[92m 2.66100 [0m(-0.03582)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_144.pth

[4m[1m > EPOCH: 8/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:49:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 150[0m
     | > loss: 3.33697  (3.23999)
     | > log_mle: 0.59323  (0.57242)
     | > loss_dur: 2.74374  (2.66757)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.05187  (7.91558)
     | > current_lr: 0.00000 
     | > step_time: 0.64360  (0.67478)
     | > loader_time: 0.39340  (0.40503)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01201)
     | > avg_loss:[92m 3.17726 [0m(-0.02872)
     | > avg_log_mle:[92m 0.54385 [0m(-0.00113)
     | > avg_loss_dur:[92m 2.63341 [0m(-0.02758)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_162.pth

[4m[1m > EPOCH: 9/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:49:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 175[0m
     | > loss: 3.37918  (3.30686)
     | > log_mle: 0.57539  (0.56999)
     | > loss_dur: 2.80379  (2.73687)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.98379  (7.93314)
     | > current_lr: 0.00000 
     | > step_time: 0.79570  (0.72859)
     | > loader_time: 0.54050  (0.48667)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00801)
     | > avg_loss:[91m 3.22167 [0m(+0.04441)
     | > avg_log_mle:[92m 0.54241 [0m(-0.00144)
     | > avg_loss_dur:[91m 2.67927 [0m(+0.04585)


[4m[1m > EPOCH: 10/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:50:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[92m 3.18618 [0m(-0.03550)
     | > avg_log_mle:[92m 0.54057 [0m(-0.00184)
     | > avg_loss_dur:[92m 2.64561 [0m(-0.03366)


[4m[1m > EPOCH: 11/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:50:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 200[0m
     | > loss: 3.16218  (3.16996)
     | > log_mle: 0.53812  (0.55070)
     | > loss_dur: 2.62406  (2.61925)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.59808  (7.60502)
     | > current_lr: 0.00000 
     | > step_time: 0.57050  (0.61456)
     | > loader_time: 0.34330  (0.35032)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00701)
     | > avg_loss:[92m 3.16030 [0m(-0.02588)
     | > avg_log_mle:[92m 0.53821 [0m(-0.00235)
     | > avg_loss_dur:[92m 2.62209 [0m(-0.02352)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_216.pth

[4m[1m > EPOCH: 12/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:51:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 225[0m
     | > loss: 3.21500  (3.17204)
     | > log_mle: 0.55922  (0.56479)
     | > loss_dur: 2.65578  (2.60724)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.41825  (7.40506)
     | > current_lr: 0.00000 
     | > step_time: 0.92280  (0.70220)
     | > loader_time: 0.68160  (0.44763)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00901)
     | > avg_loss:[91m 3.16838 [0m(+0.00808)
     | > avg_log_mle:[92m 0.53519 [0m(-0.00303)
     | > avg_loss_dur:[91m 2.63319 [0m(+0.01111)


[4m[1m > EPOCH: 13/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:51:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 250[0m
     | > loss: 3.25887  (3.18932)
     | > log_mle: 0.56446  (0.56130)
     | > loss_dur: 2.69440  (2.62803)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.32599  (7.27686)
     | > current_lr: 0.00000 
     | > step_time: 0.95890  (0.76995)
     | > loader_time: 0.58750  (0.47174)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 3.15354 [0m(-0.01484)
     | > avg_log_mle:[92m 0.53130 [0m(-0.00389)
     | > avg_loss_dur:[92m 2.62224 [0m(-0.01095)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_252.pth

[4m[1m > EPOCH: 14/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:51:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.00901)
     | > avg_loss:[92m 3.10687 [0m(-0.04667)
     | > avg_log_mle:[92m 0.52631 [0m(-0.00499)
     | > avg_loss_dur:[92m 2.58056 [0m(-0.04168)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_270.pth

[4m[1m > EPOCH: 15/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:52:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 275[0m
     | > loss: 3.08608  (3.01656)
     | > log_mle: 0.56780  (0.54983)
     | > loss_dur: 2.51828  (2.46673)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.86061  (6.77241)
     | > current_lr: 0.00000 
     | > step_time: 0.74670  (0.68102)
     | > loader_time: 0.46040  (0.41097)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.01201)
     | > avg_loss:[92m 3.08162 [0m(-0.02524)
     | > avg_log_mle:[92m 0.51997 [0m(-0.00634)
     | > avg_loss_dur:[92m 2.56165 [0m(-0.01891)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_288.pth

[4m[1m > EPOCH: 16/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:52:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 300[0m
     | > loss: 3.09264  (3.04590)
     | > log_mle: 0.54904  (0.54514)
     | > loss_dur: 2.54360  (2.50075)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.59751  (6.63021)
     | > current_lr: 0.00000 
     | > step_time: 0.92780  (0.72191)
     | > loader_time: 0.66060  (0.45550)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[92m 3.04864 [0m(-0.03298)
     | > avg_log_mle:[92m 0.51204 [0m(-0.00794)
     | > avg_loss_dur:[92m 2.53661 [0m(-0.02505)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_306.pth

[4m[1m > EPOCH: 17/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:53:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00100)
     | > avg_loss:[92m 3.02565 [0m(-0.02299)
     | > avg_log_mle:[92m 0.50229 [0m(-0.00974)
     | > avg_loss_dur:[92m 2.52336 [0m(-0.01324)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_324.pth

[4m[1m > EPOCH: 18/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:53:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 325[0m
     | > loss: 2.88680  (2.88680)
     | > log_mle: 0.52736  (0.52736)
     | > loss_dur: 2.35945  (2.35945)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.19045  (6.19045)
     | > current_lr: 0.00000 
     | > step_time: 0.65760  (0.65760)
     | > loader_time: 0.36030  (0.36033)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00601)
     | > avg_loss:[92m 2.97017 [0m(-0.05548)
     | > avg_log_mle:[92m 0.49065 [0m(-0.01164)
     | > avg_loss_dur:[92m 2.47952 [0m(-0.04384)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_342.pth

[4m[1m > EPOCH: 19/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:54:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 350[0m
     | > loss: 2.94423  (2.89262)
     | > log_mle: 0.51646  (0.51795)
     | > loss_dur: 2.42776  (2.37467)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.07509  (6.02497)
     | > current_lr: 0.00000 
     | > step_time: 0.68760  (0.67436)
     | > loader_time: 0.40140  (0.40399)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01301)
     | > avg_loss:[92m 2.91113 [0m(-0.05904)
     | > avg_log_mle:[92m 0.47714 [0m(-0.01351)
     | > avg_loss_dur:[92m 2.43399 [0m(-0.04553)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_360.pth

[4m[1m > EPOCH: 20/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:54:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 375[0m
     | > loss: 2.98268  (2.94520)
     | > log_mle: 0.49593  (0.50221)
     | > loss_dur: 2.48676  (2.44299)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.01303  (5.98176)
     | > current_lr: 0.00000 
     | > step_time: 0.88480  (0.75736)
     | > loader_time: 0.54650  (0.45948)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.01001)
     | > avg_loss:[92m 2.89689 [0m(-0.01424)
     | > avg_log_mle:[92m 0.46211 [0m(-0.01502)
     | > avg_loss_dur:[91m 2.43478 [0m(+0.00078)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_378.pth

[4m[1m > EPOCH: 21/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:55:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00501)
     | > avg_loss:[92m 2.85502 [0m(-0.04187)
     | > avg_log_mle:[92m 0.44611 [0m(-0.01600)
     | > avg_loss_dur:[92m 2.40891 [0m(-0.02587)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_396.pth

[4m[1m > EPOCH: 22/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:55:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 400[0m
     | > loss: 2.80271  (2.77582)
     | > log_mle: 0.47742  (0.46925)
     | > loss_dur: 2.32529  (2.30657)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.70279  (5.69777)
     | > current_lr: 0.00001 
     | > step_time: 0.74170  (0.66486)
     | > loader_time: 0.48540  (0.39486)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.00601)
     | > avg_loss:[92m 2.78632 [0m(-0.06870)
     | > avg_log_mle:[92m 0.42966 [0m(-0.01645)
     | > avg_loss_dur:[92m 2.35666 [0m(-0.05224)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_414.pth

[4m[1m > EPOCH: 23/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:56:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 425[0m
     | > loss: 2.92283  (2.80484)
     | > log_mle: 0.45191  (0.45675)
     | > loss_dur: 2.47092  (2.34809)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.86497  (5.69587)
     | > current_lr: 0.00001 
     | > step_time: 0.74870  (0.70373)
     | > loader_time: 0.47340  (0.43430)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01602)
     | > avg_loss:[92m 2.71919 [0m(-0.06713)
     | > avg_log_mle:[92m 0.41307 [0m(-0.01658)
     | > avg_loss_dur:[92m 2.30612 [0m(-0.05054)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_432.pth

[4m[1m > EPOCH: 24/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:56:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00901)
     | > avg_loss:[92m 2.66075 [0m(-0.05844)
     | > avg_log_mle:[92m 0.39639 [0m(-0.01668)
     | > avg_loss_dur:[92m 2.26437 [0m(-0.04176)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_450.pth

[4m[1m > EPOCH: 25/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:56:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 450[0m
     | > loss: 2.80786  (2.80786)
     | > log_mle: 0.42023  (0.42023)
     | > loss_dur: 2.38763  (2.38763)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.75080  (5.75080)
     | > current_lr: 0.00001 
     | > step_time: 0.63260  (0.63258)
     | > loader_time: 0.27830  (0.27825)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00300)
     | > avg_loss:[92m 2.55188 [0m(-0.10888)
     | > avg_log_mle:[92m 0.37949 [0m(-0.01690)
     | > avg_loss_dur:[92m 2.17239 [0m(-0.09198)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_468.pth

[4m[1m > EPOCH: 26/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:57:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 475[0m
     | > loss: 2.62232  (2.55233)
     | > log_mle: 0.40475  (0.41063)
     | > loss_dur: 2.21757  (2.14169)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.45438  (5.35666)
     | > current_lr: 0.00001 
     | > step_time: 0.65260  (0.66789)
     | > loader_time: 0.40740  (0.41924)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00200)
     | > avg_loss:[92m 2.45628 [0m(-0.09559)
     | > avg_log_mle:[92m 0.36209 [0m(-0.01740)
     | > avg_loss_dur:[92m 2.09420 [0m(-0.07819)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_486.pth

[4m[1m > EPOCH: 27/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:57:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 500[0m
     | > loss: 2.64134  (2.52033)
     | > log_mle: 0.39117  (0.39177)
     | > loss_dur: 2.25017  (2.12856)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.47985  (5.33630)
     | > current_lr: 0.00001 
     | > step_time: 1.02090  (0.74475)
     | > loader_time: 0.58550  (0.46778)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00300)
     | > avg_loss:[92m 2.35381 [0m(-0.10247)
     | > avg_log_mle:[92m 0.34389 [0m(-0.01819)
     | > avg_loss_dur:[92m 2.00992 [0m(-0.08428)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_504.pth

[4m[1m > EPOCH: 28/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:58:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00100)
     | > avg_loss:[92m 2.22553 [0m(-0.12828)
     | > avg_log_mle:[92m 0.32494 [0m(-0.01896)
     | > avg_loss_dur:[92m 1.90060 [0m(-0.10932)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_522.pth

[4m[1m > EPOCH: 29/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:58:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 525[0m
     | > loss: 2.20521  (2.23719)
     | > log_mle: 0.35795  (0.35076)
     | > loss_dur: 1.84726  (1.88643)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.93663  (5.00734)
     | > current_lr: 0.00001 
     | > step_time: 0.68160  (0.63258)
     | > loader_time: 0.40240  (0.42505)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00100)
     | > avg_loss:[92m 2.10867 [0m(-0.11686)
     | > avg_log_mle:[92m 0.30531 [0m(-0.01962)
     | > avg_loss_dur:[92m 1.80336 [0m(-0.09724)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_540.pth

[4m[1m > EPOCH: 30/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:59:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 550[0m
     | > loss: 2.25865  (2.19092)
     | > log_mle: 0.32711  (0.33967)
     | > loss_dur: 1.93154  (1.85125)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.00044  (4.90142)
     | > current_lr: 0.00001 
     | > step_time: 0.71260  (0.68913)
     | > loader_time: 0.44740  (0.42989)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00000)
     | > avg_loss:[92m 2.00464 [0m(-0.10403)
     | > avg_log_mle:[92m 0.28519 [0m(-0.02013)
     | > avg_loss_dur:[92m 1.71946 [0m(-0.08390)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_558.pth

[4m[1m > EPOCH: 31/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 04:59:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 575[0m
     | > loss: 2.26633  (2.13151)
     | > log_mle: 0.31696  (0.31928)
     | > loss_dur: 1.94937  (1.81223)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.95293  (4.77783)
     | > current_lr: 0.00001 
     | > step_time: 0.83980  (0.76423)
     | > loader_time: 0.43740  (0.49804)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01101)
     | > avg_loss:[92m 1.88361 [0m(-0.12104)
     | > avg_log_mle:[92m 0.26465 [0m(-0.02054)
     | > avg_loss_dur:[92m 1.61896 [0m(-0.10050)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_576.pth

[4m[1m > EPOCH: 32/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:00:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00400)
     | > avg_loss:[92m 1.81408 [0m(-0.06953)
     | > avg_log_mle:[92m 0.24465 [0m(-0.01999)
     | > avg_loss_dur:[92m 1.56942 [0m(-0.04954)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_594.pth

[4m[1m > EPOCH: 33/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:00:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 600[0m
     | > loss: 1.93466  (1.87504)
     | > log_mle: 0.30387  (0.28724)
     | > loss_dur: 1.63080  (1.58780)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.31533  (4.28055)
     | > current_lr: 0.00001 
     | > step_time: 0.62960  (0.66377)
     | > loader_time: 0.40440  (0.40520)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00701)
     | > avg_loss:[92m 1.74746 [0m(-0.06662)
     | > avg_log_mle:[92m 0.22625 [0m(-0.01840)
     | > avg_loss_dur:[92m 1.52121 [0m(-0.04821)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_612.pth

[4m[1m > EPOCH: 34/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:01:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 625[0m
     | > loss: 1.96306  (1.84918)
     | > log_mle: 0.26824  (0.26693)
     | > loss_dur: 1.69481  (1.58225)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.29129  (4.17031)
     | > current_lr: 0.00001 
     | > step_time: 0.77770  (0.71604)
     | > loader_time: 0.48140  (0.44248)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01301)
     | > avg_loss:[92m 1.68693 [0m(-0.06053)
     | > avg_log_mle:[92m 0.20986 [0m(-0.01639)
     | > avg_loss_dur:[92m 1.47707 [0m(-0.04414)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_630.pth

[4m[1m > EPOCH: 35/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:01:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00801)
     | > avg_loss:[92m 1.62894 [0m(-0.05799)
     | > avg_log_mle:[92m 0.19522 [0m(-0.01464)
     | > avg_loss_dur:[92m 1.43372 [0m(-0.04335)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_648.pth

[4m[1m > EPOCH: 36/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:01:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 650[0m
     | > loss: 1.65537  (1.65171)
     | > log_mle: 0.20908  (0.22333)
     | > loss_dur: 1.44629  (1.42838)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.82684  (3.80284)
     | > current_lr: 0.00001 
     | > step_time: 0.55450  (0.60005)
     | > loader_time: 0.34630  (0.42889)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[92m 1.57062 [0m(-0.05832)
     | > avg_log_mle:[92m 0.18214 [0m(-0.01308)
     | > avg_loss_dur:[92m 1.38848 [0m(-0.04524)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_666.pth

[4m[1m > EPOCH: 37/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:02:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 675[0m
     | > loss: 1.67825  (1.62669)
     | > log_mle: 0.22682  (0.22582)
     | > loss_dur: 1.45143  (1.40087)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.80438  (3.71393)
     | > current_lr: 0.00001 
     | > step_time: 0.86880  (0.68740)
     | > loader_time: 0.57250  (0.43284)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00601)
     | > avg_loss:[92m 1.51822 [0m(-0.05240)
     | > avg_log_mle:[92m 0.17036 [0m(-0.01177)
     | > avg_loss_dur:[92m 1.34786 [0m(-0.04062)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_684.pth

[4m[1m > EPOCH: 38/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:02:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 700[0m
     | > loss: 1.66607  (1.61203)
     | > log_mle: 0.20341  (0.21274)
     | > loss_dur: 1.46266  (1.39929)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.75023  (3.64917)
     | > current_lr: 0.00001 
     | > step_time: 0.94890  (0.75913)
     | > loader_time: 0.62260  (0.49901)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.00701)
     | > avg_loss:[92m 1.46741 [0m(-0.05081)
     | > avg_log_mle:[92m 0.15965 [0m(-0.01071)
     | > avg_loss_dur:[92m 1.30776 [0m(-0.04010)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_702.pth

[4m[1m > EPOCH: 39/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:03:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01301)
     | > avg_loss:[92m 1.42073 [0m(-0.04668)
     | > avg_log_mle:[92m 0.14976 [0m(-0.00989)
     | > avg_loss_dur:[92m 1.27096 [0m(-0.03680)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_720.pth

[4m[1m > EPOCH: 40/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:03:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 725[0m
     | > loss: 1.47800  (1.44456)
     | > log_mle: 0.21077  (0.19104)
     | > loss_dur: 1.26723  (1.25352)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.32731  (3.32474)
     | > current_lr: 0.00001 
     | > step_time: 0.73670  (0.67041)
     | > loader_time: 0.42540  (0.40837)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00100)
     | > avg_loss:[92m 1.37668 [0m(-0.04405)
     | > avg_log_mle:[92m 0.14044 [0m(-0.00932)
     | > avg_loss_dur:[92m 1.23624 [0m(-0.03473)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_738.pth

[4m[1m > EPOCH: 41/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:04:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 750[0m
     | > loss: 1.51850  (1.45413)
     | > log_mle: 0.18835  (0.18359)
     | > loss_dur: 1.33014  (1.27053)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.35983  (3.30961)
     | > current_lr: 0.00001 
     | > step_time: 0.90880  (0.71131)
     | > loader_time: 0.67160  (0.45425)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00300)
     | > avg_loss:[92m 1.34458 [0m(-0.03210)
     | > avg_log_mle:[92m 0.13128 [0m(-0.00916)
     | > avg_loss_dur:[92m 1.21330 [0m(-0.02294)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_756.pth

[4m[1m > EPOCH: 42/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:04:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01001)
     | > avg_loss:[92m 1.30954 [0m(-0.03504)
     | > avg_log_mle:[92m 0.12229 [0m(-0.00899)
     | > avg_loss_dur:[92m 1.18725 [0m(-0.02604)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_774.pth

[4m[1m > EPOCH: 43/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:05:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 775[0m
     | > loss: 1.31645  (1.31645)
     | > log_mle: 0.16298  (0.16298)
     | > loss_dur: 1.15347  (1.15347)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.03813  (3.03813)
     | > current_lr: 0.00001 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.53950  (0.53949)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[92m 1.27803 [0m(-0.03152)
     | > avg_log_mle:[92m 0.11344 [0m(-0.00885)
     | > avg_loss_dur:[92m 1.16459 [0m(-0.02266)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_792.pth

[4m[1m > EPOCH: 44/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:05:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 800[0m
     | > loss: 1.33904  (1.31561)
     | > log_mle: 0.15362  (0.15642)
     | > loss_dur: 1.18542  (1.15920)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.06909  (3.02080)
     | > current_lr: 0.00001 
     | > step_time: 0.67260  (0.66198)
     | > loader_time: 0.41840  (0.41876)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00200)
     | > avg_loss:[92m 1.25843 [0m(-0.01959)
     | > avg_log_mle:[92m 0.10421 [0m(-0.00922)
     | > avg_loss_dur:[92m 1.15422 [0m(-0.01037)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_810.pth

[4m[1m > EPOCH: 45/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:06:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 825[0m
     | > loss: 1.35458  (1.32831)
     | > log_mle: 0.13827  (0.14674)
     | > loss_dur: 1.21631  (1.18157)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.13996  (3.03846)
     | > current_lr: 0.00001 
     | > step_time: 0.86880  (0.74922)
     | > loader_time: 0.53850  (0.47123)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.01001)
     | > avg_loss:[92m 1.22648 [0m(-0.03196)
     | > avg_log_mle:[92m 0.09539 [0m(-0.00882)
     | > avg_loss_dur:[92m 1.13108 [0m(-0.02314)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_828.pth

[4m[1m > EPOCH: 46/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:06:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00801)
     | > avg_loss:[92m 1.21180 [0m(-0.01468)
     | > avg_log_mle:[92m 0.08671 [0m(-0.00868)
     | > avg_loss_dur:[92m 1.12509 [0m(-0.00599)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_846.pth

[4m[1m > EPOCH: 47/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:07:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 850[0m
     | > loss: 1.20507  (1.19395)
     | > log_mle: 0.13055  (0.12182)
     | > loss_dur: 1.07452  (1.07213)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.80231  (2.82809)
     | > current_lr: 0.00001 
     | > step_time: 0.73470  (0.65560)
     | > loader_time: 0.65760  (0.43865)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01101)
     | > avg_loss:[92m 1.18222 [0m(-0.02958)
     | > avg_log_mle:[92m 0.07825 [0m(-0.00846)
     | > avg_loss_dur:[92m 1.10396 [0m(-0.02113)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_864.pth

[4m[1m > EPOCH: 48/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:07:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 875[0m
     | > loss: 1.29909  (1.21936)
     | > log_mle: 0.11881  (0.12000)
     | > loss_dur: 1.18027  (1.09936)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.94828  (2.84105)
     | > current_lr: 0.00001 
     | > step_time: 0.72870  (0.68999)
     | > loader_time: 0.41940  (0.41347)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00500)
     | > avg_loss:[92m 1.15099 [0m(-0.03122)
     | > avg_log_mle:[92m 0.07020 [0m(-0.00805)
     | > avg_loss_dur:[92m 1.08080 [0m(-0.02317)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_882.pth

[4m[1m > EPOCH: 49/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:08:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 1.12631 [0m(-0.02468)
     | > avg_log_mle:[92m 0.06267 [0m(-0.00753)
     | > avg_loss_dur:[92m 1.06364 [0m(-0.01715)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_900.pth

[4m[1m > EPOCH: 50/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:08:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 900[0m
     | > loss: 1.21513  (1.21513)
     | > log_mle: 0.08888  (0.08888)
     | > loss_dur: 1.12625  (1.12625)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.94121  (2.94121)
     | > current_lr: 0.00001 
     | > step_time: 0.49650  (0.49645)
     | > loader_time: 0.27220  (0.27225)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00701)
     | > avg_loss:[92m 1.10606 [0m(-0.02025)
     | > avg_log_mle:[92m 0.05553 [0m(-0.00714)
     | > avg_loss_dur:[92m 1.05053 [0m(-0.01311)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_918.pth

[4m[1m > EPOCH: 51/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:09:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 925[0m
     | > loss: 1.16725  (1.11744)
     | > log_mle: 0.09305  (0.09738)
     | > loss_dur: 1.07420  (1.02007)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.78319  (2.65894)
     | > current_lr: 0.00001 
     | > step_time: 0.64360  (0.66117)
     | > loader_time: 0.41640  (0.41323)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00901)
     | > avg_loss:[92m 1.07742 [0m(-0.02865)
     | > avg_log_mle:[92m 0.04826 [0m(-0.00727)
     | > avg_loss_dur:[92m 1.02915 [0m(-0.02138)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_936.pth

[4m[1m > EPOCH: 52/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:09:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 950[0m
     | > loss: 1.23538  (1.13922)
     | > log_mle: 0.09403  (0.08970)
     | > loss_dur: 1.14135  (1.04951)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.87203  (2.67486)
     | > current_lr: 0.00001 
     | > step_time: 1.01290  (0.73653)
     | > loader_time: 0.60860  (0.46549)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00701)
     | > avg_loss:[92m 1.05260 [0m(-0.02482)
     | > avg_log_mle:[92m 0.04126 [0m(-0.00700)
     | > avg_loss_dur:[92m 1.01133 [0m(-0.01782)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_954.pth

[4m[1m > EPOCH: 53/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:09:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00601)
     | > avg_loss:[92m 1.03759 [0m(-0.01501)
     | > avg_log_mle:[92m 0.03443 [0m(-0.00684)
     | > avg_loss_dur:[92m 1.00317 [0m(-0.00817)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_972.pth

[4m[1m > EPOCH: 54/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:10:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 975[0m
     | > loss: 1.01153  (1.02106)
     | > log_mle: 0.07566  (0.06560)
     | > loss_dur: 0.93587  (0.95546)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.44073  (2.50679)
     | > current_lr: 0.00001 
     | > step_time: 0.68160  (0.62757)
     | > loader_time: 0.39940  (0.36833)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00100)
     | > avg_loss:[92m 1.01072 [0m(-0.02687)
     | > avg_log_mle:[92m 0.02778 [0m(-0.00664)
     | > avg_loss_dur:[92m 0.98294 [0m(-0.02023)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_990.pth

[4m[1m > EPOCH: 55/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:10:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 1000[0m
     | > loss: 1.10344  (1.04276)
     | > log_mle: 0.06172  (0.06742)
     | > loss_dur: 1.04172  (0.97535)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.67470  (2.49780)
     | > current_lr: 0.00001 
     | > step_time: 0.69460  (0.68773)
     | > loader_time: 0.41640  (0.47413)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[92m 1.00021 [0m(-0.01050)
     | > avg_log_mle:[92m 0.02116 [0m(-0.00662)
     | > avg_loss_dur:[92m 0.97905 [0m(-0.00388)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1008.pth

[4m[1m > EPOCH: 56/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:11:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 1025[0m
     | > loss: 1.18141  (1.06022)
     | > log_mle: 0.06177  (0.06061)
     | > loss_dur: 1.11964  (0.99961)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.77472  (2.53645)
     | > current_lr: 0.00001 
     | > step_time: 0.84280  (0.76505)
     | > loader_time: 0.43940  (0.48120)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00100)
     | > avg_loss:[92m 0.96947 [0m(-0.03075)
     | > avg_log_mle:[92m 0.01460 [0m(-0.00656)
     | > avg_loss_dur:[92m 0.95487 [0m(-0.02419)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1026.pth

[4m[1m > EPOCH: 57/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:11:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[92m 0.94485 [0m(-0.02462)
     | > avg_log_mle:[92m 0.00796 [0m(-0.00664)
     | > avg_loss_dur:[92m 0.93689 [0m(-0.01798)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1044.pth

[4m[1m > EPOCH: 58/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:12:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 1050[0m
     | > loss: 1.01074  (0.95966)
     | > log_mle: 0.06660  (0.04905)
     | > loss_dur: 0.94414  (0.91061)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.28873  (2.28225)
     | > current_lr: 0.00001 
     | > step_time: 0.63560  (0.66744)
     | > loader_time: 0.41540  (0.41237)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[92m 0.92510 [0m(-0.01974)
     | > avg_log_mle:[92m 0.00180 [0m(-0.00615)
     | > avg_loss_dur:[92m 0.92330 [0m(-0.01359)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1062.pth

[4m[1m > EPOCH: 59/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:12:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 1075[0m
     | > loss: 1.07277  (0.97785)
     | > log_mle: 0.04604  (0.04061)
     | > loss_dur: 1.02672  (0.93724)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.52070  (2.37112)
     | > current_lr: 0.00001 
     | > step_time: 0.77670  (0.71380)
     | > loader_time: 0.51350  (0.44263)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[92m 0.91086 [0m(-0.01424)
     | > avg_log_mle:[92m -0.00488 [0m(-0.00669)
     | > avg_loss_dur:[92m 0.91575 [0m(-0.00755)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1080.pth

[4m[1m > EPOCH: 60/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:13:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[92m 0.88835 [0m(-0.02251)
     | > avg_log_mle:[92m -0.01141 [0m(-0.00653)
     | > avg_loss_dur:[92m 0.89976 [0m(-0.01599)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1098.pth

[4m[1m > EPOCH: 61/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:13:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 1100[0m
     | > loss: 0.88706  (0.89194)
     | > log_mle: 0.00227  (0.01343)
     | > loss_dur: 0.88479  (0.87851)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.28650  (2.23297)
     | > current_lr: 0.00002 
     | > step_time: 0.55650  (0.60255)
     | > loader_time: 0.35630  (0.35732)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[92m 0.87033 [0m(-0.01802)
     | > avg_log_mle:[92m -0.01805 [0m(-0.00664)
     | > avg_loss_dur:[92m 0.88838 [0m(-0.01138)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1116.pth

[4m[1m > EPOCH: 62/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:14:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 1125[0m
     | > loss: 0.92805  (0.90079)
     | > log_mle: 0.01745  (0.02038)
     | > loss_dur: 0.91060  (0.88041)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.24035  (2.15079)
     | > current_lr: 0.00002 
     | > step_time: 0.86880  (0.68485)
     | > loader_time: 0.59250  (0.43239)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00100)
     | > avg_loss:[92m 0.84576 [0m(-0.02457)
     | > avg_log_mle:[92m -0.02445 [0m(-0.00640)
     | > avg_loss_dur:[92m 0.87021 [0m(-0.01817)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1134.pth

[4m[1m > EPOCH: 63/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:14:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 1150[0m
     | > loss: 0.96318  (0.91579)
     | > log_mle: 0.00858  (0.01283)
     | > loss_dur: 0.95459  (0.90296)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.37330  (2.19074)
     | > current_lr: 0.00002 
     | > step_time: 0.95990  (0.75919)
     | > loader_time: 0.61660  (0.47706)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01201)
     | > avg_loss:[92m 0.83319 [0m(-0.01257)
     | > avg_log_mle:[92m -0.03097 [0m(-0.00652)
     | > avg_loss_dur:[92m 0.86415 [0m(-0.00605)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1152.pth

[4m[1m > EPOCH: 64/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:15:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.00100)
     | > avg_loss:[92m 0.81277 [0m(-0.02041)
     | > avg_log_mle:[92m -0.03753 [0m(-0.00656)
     | > avg_loss_dur:[92m 0.85031 [0m(-0.01385)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1170.pth

[4m[1m > EPOCH: 65/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:15:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 1175[0m
     | > loss: 0.85474  (0.82281)
     | > log_mle: 0.01543  (-0.00154)
     | > loss_dur: 0.83931  (0.82435)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.92751  (1.96957)
     | > current_lr: 0.00002 
     | > step_time: 0.73770  (0.67021)
     | > loader_time: 0.43140  (0.41097)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00400)
     | > avg_loss:[92m 0.79130 [0m(-0.02147)
     | > avg_log_mle:[92m -0.04425 [0m(-0.00671)
     | > avg_loss_dur:[92m 0.83555 [0m(-0.01476)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1188.pth

[4m[1m > EPOCH: 66/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:16:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 1200[0m
     | > loss: 0.88553  (0.84306)
     | > log_mle: -0.00796  (-0.00716)
     | > loss_dur: 0.89349  (0.85022)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.04648  (1.97179)
     | > current_lr: 0.00002 
     | > step_time: 0.91580  (0.71056)
     | > loader_time: 0.58050  (0.45750)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00200)
     | > avg_loss:[92m 0.78698 [0m(-0.00433)
     | > avg_log_mle:[92m -0.05105 [0m(-0.00681)
     | > avg_loss_dur:[91m 0.83803 [0m(+0.00248)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1206.pth

[4m[1m > EPOCH: 67/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:16:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[92m 0.77283 [0m(-0.01415)
     | > avg_log_mle:[92m -0.05749 [0m(-0.00644)
     | > avg_loss_dur:[92m 0.83032 [0m(-0.00771)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1224.pth

[4m[1m > EPOCH: 68/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:17:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 1225[0m
     | > loss: 0.76666  (0.76666)
     | > log_mle: -0.02158  (-0.02158)
     | > loss_dur: 0.78825  (0.78825)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.92508  (1.92508)
     | > current_lr: 0.00002 
     | > step_time: 0.64660  (0.64659)
     | > loader_time: 0.38130  (0.38135)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01101)
     | > avg_loss:[92m 0.75498 [0m(-0.01785)
     | > avg_log_mle:[92m -0.06396 [0m(-0.00646)
     | > avg_loss_dur:[92m 0.81893 [0m(-0.01139)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1242.pth

[4m[1m > EPOCH: 69/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:17:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 1250[0m
     | > loss: 0.81039  (0.77525)
     | > log_mle: -0.03091  (-0.02662)
     | > loss_dur: 0.84131  (0.80188)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.85566  (1.80165)
     | > current_lr: 0.00002 
     | > step_time: 0.67760  (0.66385)
     | > loader_time: 0.40540  (0.40812)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00901)
     | > avg_loss:[92m 0.73574 [0m(-0.01924)
     | > avg_log_mle:[92m -0.07107 [0m(-0.00711)
     | > avg_loss_dur:[92m 0.80681 [0m(-0.01213)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1260.pth

[4m[1m > EPOCH: 70/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:18:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 1275[0m
     | > loss: 0.80288  (0.78945)
     | > log_mle: -0.04079  (-0.03433)
     | > loss_dur: 0.84367  (0.82378)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.89671  (1.84535)
     | > current_lr: 0.00002 
     | > step_time: 0.86980  (0.74461)
     | > loader_time: 0.55750  (0.47076)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00000)
     | > avg_loss:[92m 0.72171 [0m(-0.01403)
     | > avg_log_mle:[92m -0.07819 [0m(-0.00713)
     | > avg_loss_dur:[92m 0.79990 [0m(-0.00691)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1278.pth

[4m[1m > EPOCH: 71/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:18:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[92m 0.70366 [0m(-0.01805)
     | > avg_log_mle:[92m -0.08500 [0m(-0.00681)
     | > avg_loss_dur:[92m 0.78866 [0m(-0.01123)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1296.pth

[4m[1m > EPOCH: 72/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:19:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 1300[0m
     | > loss: 0.71617  (0.70429)
     | > log_mle: -0.04622  (-0.05269)
     | > loss_dur: 0.76239  (0.75697)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.66946  (1.65631)
     | > current_lr: 0.00002 
     | > step_time: 0.73170  (0.65560)
     | > loader_time: 0.47940  (0.40237)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00000)
     | > avg_loss:[92m 0.69586 [0m(-0.00779)
     | > avg_log_mle:[92m -0.09116 [0m(-0.00616)
     | > avg_loss_dur:[92m 0.78702 [0m(-0.00164)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1314.pth

[4m[1m > EPOCH: 73/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:19:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 1325[0m
     | > loss: 0.78473  (0.72862)
     | > log_mle: -0.05677  (-0.05475)
     | > loss_dur: 0.84150  (0.78337)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.82082  (1.71122)
     | > current_lr: 0.00002 
     | > step_time: 0.73370  (0.68844)
     | > loader_time: 0.45540  (0.44295)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00601)
     | > avg_loss:[92m 0.67763 [0m(-0.01824)
     | > avg_log_mle:[92m -0.09870 [0m(-0.00754)
     | > avg_loss_dur:[92m 0.77632 [0m(-0.01070)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1332.pth

[4m[1m > EPOCH: 74/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:20:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06306 [0m(+0.00100)
     | > avg_loss:[92m 0.66008 [0m(-0.01754)
     | > avg_log_mle:[92m -0.10535 [0m(-0.00665)
     | > avg_loss_dur:[92m 0.76544 [0m(-0.01089)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1350.pth

[4m[1m > EPOCH: 75/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:20:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 1350[0m
     | > loss: 0.71645  (0.71645)
     | > log_mle: -0.08201  (-0.08201)
     | > loss_dur: 0.79846  (0.79846)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.80498  (1.80498)
     | > current_lr: 0.00002 
     | > step_time: 0.66960  (0.66961)
     | > loader_time: 0.27620  (0.27625)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01101)
     | > avg_loss:[92m 0.64628 [0m(-0.01381)
     | > avg_log_mle:[92m -0.11220 [0m(-0.00685)
     | > avg_loss_dur:[92m 0.75848 [0m(-0.00696)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1368.pth

[4m[1m > EPOCH: 76/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:21:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 1375[0m
     | > loss: 0.69779  (0.67415)
     | > log_mle: -0.07969  (-0.07347)
     | > loss_dur: 0.77748  (0.74762)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.57642  (1.45318)
     | > current_lr: 0.00002 
     | > step_time: 0.64360  (0.66460)
     | > loader_time: 0.42640  (0.41652)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00701)
     | > avg_loss:[92m 0.64548 [0m(-0.00080)
     | > avg_log_mle:[92m -0.11854 [0m(-0.00634)
     | > avg_loss_dur:[91m 0.76402 [0m(+0.00554)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1386.pth

[4m[1m > EPOCH: 77/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:21:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 1400[0m
     | > loss: 0.75041  (0.69040)
     | > log_mle: -0.07637  (-0.08085)
     | > loss_dur: 0.82677  (0.77126)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.69881  (1.53600)
     | > current_lr: 0.00002 
     | > step_time: 1.02390  (0.73567)
     | > loader_time: 0.59750  (0.49345)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00100)
     | > avg_loss:[92m 0.62398 [0m(-0.02150)
     | > avg_log_mle:[92m -0.12492 [0m(-0.00638)
     | > avg_loss_dur:[92m 0.74890 [0m(-0.01512)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1404.pth

[4m[1m > EPOCH: 78/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:22:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.61828 [0m(-0.00569)
     | > avg_log_mle:[92m -0.13146 [0m(-0.00654)
     | > avg_loss_dur:[91m 0.74974 [0m(+0.00085)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1422.pth

[4m[1m > EPOCH: 79/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:22:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 1425[0m
     | > loss: 0.60278  (0.61205)
     | > log_mle: -0.09236  (-0.10021)
     | > loss_dur: 0.69514  (0.71226)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.25331  (1.37105)
     | > current_lr: 0.00002 
     | > step_time: 0.67760  (0.62490)
     | > loader_time: 0.41340  (0.37267)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00200)
     | > avg_loss:[92m 0.60366 [0m(-0.01463)
     | > avg_log_mle:[92m -0.13763 [0m(-0.00617)
     | > avg_loss_dur:[92m 0.74128 [0m(-0.00846)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1440.pth

[4m[1m > EPOCH: 80/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:23:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 1450[0m
     | > loss: 0.67533  (0.63551)
     | > log_mle: -0.10084  (-0.09917)
     | > loss_dur: 0.77617  (0.73468)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.50131  (1.42917)
     | > current_lr: 0.00002 
     | > step_time: 0.69760  (0.68693)
     | > loader_time: 0.47040  (0.45191)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[92m 0.58966 [0m(-0.01400)
     | > avg_log_mle:[92m -0.14350 [0m(-0.00587)
     | > avg_loss_dur:[92m 0.73316 [0m(-0.00813)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1458.pth

[4m[1m > EPOCH: 81/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:23:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 1475[0m
     | > loss: 0.74030  (0.65339)
     | > log_mle: -0.10483  (-0.10526)
     | > loss_dur: 0.84512  (0.75865)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.66268  (1.49293)
     | > current_lr: 0.00002 
     | > step_time: 0.84280  (0.75993)
     | > loader_time: 0.38430  (0.47808)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00000)
     | > avg_loss:[92m 0.58168 [0m(-0.00797)
     | > avg_log_mle:[92m -0.14888 [0m(-0.00538)
     | > avg_loss_dur:[92m 0.73056 [0m(-0.00259)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1476.pth

[4m[1m > EPOCH: 82/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:24:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[92m 0.57234 [0m(-0.00934)
     | > avg_log_mle:[92m -0.15479 [0m(-0.00591)
     | > avg_loss_dur:[92m 0.72713 [0m(-0.00343)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1494.pth

[4m[1m > EPOCH: 83/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:24:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 1500[0m
     | > loss: 0.62691  (0.58982)
     | > log_mle: -0.09775  (-0.11399)
     | > loss_dur: 0.72466  (0.70381)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.45410  (1.38901)
     | > current_lr: 0.00002 
     | > step_time: 0.63060  (0.66144)
     | > loader_time: 0.39240  (0.40220)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[92m 0.56443 [0m(-0.00791)
     | > avg_log_mle:[92m -0.16024 [0m(-0.00544)
     | > avg_loss_dur:[92m 0.72467 [0m(-0.00246)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1512.pth

[4m[1m > EPOCH: 84/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:25:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 1525[0m
     | > loss: 0.68130  (0.61025)
     | > log_mle: -0.11706  (-0.12153)
     | > loss_dur: 0.79836  (0.73179)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.42776  (1.39662)
     | > current_lr: 0.00002 
     | > step_time: 0.77670  (0.71527)
     | > loader_time: 0.47540  (0.44941)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00801)
     | > avg_loss:[92m 0.55140 [0m(-0.01303)
     | > avg_log_mle:[92m -0.16493 [0m(-0.00470)
     | > avg_loss_dur:[92m 0.71633 [0m(-0.00834)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1530.pth

[4m[1m > EPOCH: 85/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:25:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.01001)
     | > avg_loss:[92m 0.54621 [0m(-0.00519)
     | > avg_log_mle:[92m -0.16918 [0m(-0.00424)
     | > avg_loss_dur:[92m 0.71539 [0m(-0.00094)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1548.pth

[4m[1m > EPOCH: 86/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:26:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 1550[0m
     | > loss: 0.54484  (0.54728)
     | > log_mle: -0.15129  (-0.14201)
     | > loss_dur: 0.69613  (0.68929)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.16877  (1.31703)
     | > current_lr: 0.00002 
     | > step_time: 0.56150  (0.60405)
     | > loader_time: 0.33030  (0.43039)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00500)
     | > avg_loss:[92m 0.53400 [0m(-0.01222)
     | > avg_log_mle:[92m -0.17387 [0m(-0.00469)
     | > avg_loss_dur:[92m 0.70786 [0m(-0.00753)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1566.pth

[4m[1m > EPOCH: 87/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:26:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 1575[0m
     | > loss: 0.58538  (0.56308)
     | > log_mle: -0.14057  (-0.13652)
     | > loss_dur: 0.72595  (0.69960)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.24290  (1.21117)
     | > current_lr: 0.00002 
     | > step_time: 0.86380  (0.68340)
     | > loader_time: 0.57050  (0.41827)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00100)
     | > avg_loss:[92m 0.53297 [0m(-0.00103)
     | > avg_log_mle:[92m -0.17899 [0m(-0.00512)
     | > avg_loss_dur:[91m 0.71196 [0m(+0.00409)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1584.pth

[4m[1m > EPOCH: 88/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:27:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 1600[0m
     | > loss: 0.60988  (0.58021)
     | > log_mle: -0.14145  (-0.14129)
     | > loss_dur: 0.75133  (0.72150)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.49697  (1.26618)
     | > current_lr: 0.00002 
     | > step_time: 0.94590  (0.75963)
     | > loader_time: 0.55850  (0.47925)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00000)
     | > avg_loss:[92m 0.52902 [0m(-0.00395)
     | > avg_log_mle:[92m -0.18370 [0m(-0.00471)
     | > avg_loss_dur:[91m 0.71272 [0m(+0.00076)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1602.pth

[4m[1m > EPOCH: 89/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:27:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00801)
     | > avg_loss:[92m 0.52244 [0m(-0.00658)
     | > avg_log_mle:[92m -0.18763 [0m(-0.00393)
     | > avg_loss_dur:[92m 0.71007 [0m(-0.00265)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1620.pth

[4m[1m > EPOCH: 90/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:28:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 1625[0m
     | > loss: 0.55839  (0.52527)
     | > log_mle: -0.13705  (-0.15140)
     | > loss_dur: 0.69544  (0.67667)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.52778  (1.38682)
     | > current_lr: 0.00002 
     | > step_time: 0.73970  (0.67101)
     | > loader_time: 0.44640  (0.41518)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00601)
     | > avg_loss:[92m 0.51239 [0m(-0.01006)
     | > avg_log_mle:[92m -0.19152 [0m(-0.00389)
     | > avg_loss_dur:[92m 0.70390 [0m(-0.00617)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1638.pth

[4m[1m > EPOCH: 91/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:28:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 1650[0m
     | > loss: 0.58816  (0.54858)
     | > log_mle: -0.15761  (-0.15535)
     | > loss_dur: 0.74577  (0.70393)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.36118  (1.36818)
     | > current_lr: 0.00002 
     | > step_time: 0.90280  (0.70556)
     | > loader_time: 0.64460  (0.45216)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[92m 0.51104 [0m(-0.00134)
     | > avg_log_mle:[92m -0.19402 [0m(-0.00251)
     | > avg_loss_dur:[91m 0.70507 [0m(+0.00116)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1656.pth

[4m[1m > EPOCH: 92/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:29:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06605 [0m(-0.00201)
     | > avg_loss:[92m 0.49949 [0m(-0.01155)
     | > avg_log_mle:[92m -0.19874 [0m(-0.00471)
     | > avg_loss_dur:[92m 0.69823 [0m(-0.00684)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1674.pth

[4m[1m > EPOCH: 93/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:29:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 1675[0m
     | > loss: 0.50733  (0.50733)
     | > log_mle: -0.16366  (-0.16366)
     | > loss_dur: 0.67099  (0.67099)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.26631  (1.26631)
     | > current_lr: 0.00002 
     | > step_time: 0.64460  (0.64459)
     | > loader_time: 0.38430  (0.38435)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06905 [0m(+0.00300)
     | > avg_loss:[92m 0.48728 [0m(-0.01221)
     | > avg_log_mle:[92m -0.20348 [0m(-0.00474)
     | > avg_loss_dur:[92m 0.69076 [0m(-0.00747)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1692.pth

[4m[1m > EPOCH: 94/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:30:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 1700[0m
     | > loss: 0.53485  (0.51426)
     | > log_mle: -0.17251  (-0.16739)
     | > loss_dur: 0.70735  (0.68165)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.05982  (1.23543)
     | > current_lr: 0.00002 
     | > step_time: 0.67660  (0.66348)
     | > loader_time: 0.41640  (0.40687)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00599)
     | > avg_loss:[92m 0.48167 [0m(-0.00561)
     | > avg_log_mle:[92m -0.20562 [0m(-0.00215)
     | > avg_loss_dur:[92m 0.68729 [0m(-0.00347)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1710.pth

[4m[1m > EPOCH: 95/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:30:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 1725[0m
     | > loss: 0.55319  (0.53490)
     | > log_mle: -0.17472  (-0.17083)
     | > loss_dur: 0.72791  (0.70572)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.00467  (1.21472)
     | > current_lr: 0.00002 
     | > step_time: 0.86880  (0.74281)
     | > loader_time: 0.52150  (0.47076)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00200)
     | > avg_loss:[91m 0.48969 [0m(+0.00803)
     | > avg_log_mle:[92m -0.21057 [0m(-0.00494)
     | > avg_loss_dur:[91m 0.70026 [0m(+0.01297)


[4m[1m > EPOCH: 96/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:31:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00000)
     | > avg_loss:[92m 0.47323 [0m(-0.01646)
     | > avg_log_mle:[92m -0.21406 [0m(-0.00349)
     | > avg_loss_dur:[92m 0.68729 [0m(-0.01297)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1746.pth

[4m[1m > EPOCH: 97/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:31:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 1750[0m
     | > loss: 0.48647  (0.47320)
     | > log_mle: -0.18002  (-0.18416)
     | > loss_dur: 0.66649  (0.65737)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 0.90637  (0.94876)
     | > current_lr: 0.00002 
     | > step_time: 0.72470  (0.65109)
     | > loader_time: 0.47940  (0.40011)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00601)
     | > avg_loss:[92m 0.46938 [0m(-0.00385)
     | > avg_log_mle:[92m -0.21827 [0m(-0.00421)
     | > avg_loss_dur:[91m 0.68765 [0m(+0.00036)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1764.pth

[4m[1m > EPOCH: 98/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:32:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 1775[0m
     | > loss: 0.55723  (0.50424)
     | > log_mle: -0.18540  (-0.18333)
     | > loss_dur: 0.74264  (0.68758)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 0.82250  (1.08157)
     | > current_lr: 0.00002 
     | > step_time: 0.73570  (0.69018)
     | > loader_time: 0.46640  (0.44577)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00000)
     | > avg_loss:[91m 0.47471 [0m(+0.00533)
     | > avg_log_mle:[92m -0.22097 [0m(-0.00270)
     | > avg_loss_dur:[91m 0.69568 [0m(+0.00803)


[4m[1m > EPOCH: 99/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:32:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00901)
     | > avg_loss:[92m 0.46589 [0m(-0.00882)
     | > avg_log_mle:[92m -0.22384 [0m(-0.00287)
     | > avg_loss_dur:[92m 0.68973 [0m(-0.00595)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1800.pth

[4m[1m > EPOCH: 100/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:33:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 1800[0m
     | > loss: 0.48381  (0.48381)
     | > log_mle: -0.20343  (-0.20343)
     | > loss_dur: 0.68723  (0.68723)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.58908  (1.58908)
     | > current_lr: 0.00002 
     | > step_time: 0.49440  (0.49445)
     | > loader_time: 0.28120  (0.28124)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00000)
     | > avg_loss:[91m 0.46665 [0m(+0.00076)
     | > avg_log_mle:[92m -0.22788 [0m(-0.00405)
     | > avg_loss_dur:[91m 0.69453 [0m(+0.00481)


[4m[1m > EPOCH: 101/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:33:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 1825[0m
     | > loss: 0.48218  (0.47535)
     | > log_mle: -0.19898  (-0.19255)
     | > loss_dur: 0.68116  (0.66790)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 0.99592  (1.03487)
     | > current_lr: 0.00003 
     | > step_time: 0.65160  (0.66046)
     | > loader_time: 0.41840  (0.41051)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00400)
     | > avg_loss:[92m 0.45567 [0m(-0.01098)
     | > avg_log_mle:[92m -0.23055 [0m(-0.00267)
     | > avg_loss_dur:[92m 0.68623 [0m(-0.00831)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1836.pth

[4m[1m > EPOCH: 102/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:34:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 1850[0m
     | > loss: 0.55230  (0.49796)
     | > log_mle: -0.18898  (-0.19638)
     | > loss_dur: 0.74128  (0.69433)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.42540  (1.10817)
     | > current_lr: 0.00003 
     | > step_time: 1.01090  (0.73760)
     | > loader_time: 0.61160  (0.47128)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00801)
     | > avg_loss:[92m 0.45235 [0m(-0.00332)
     | > avg_log_mle:[92m -0.23367 [0m(-0.00311)
     | > avg_loss_dur:[92m 0.68602 [0m(-0.00021)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1854.pth

[4m[1m > EPOCH: 103/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:34:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00901)
     | > avg_loss:[92m 0.44597 [0m(-0.00638)
     | > avg_log_mle:[92m -0.23523 [0m(-0.00156)
     | > avg_loss_dur:[92m 0.68119 [0m(-0.00482)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1872.pth

[4m[1m > EPOCH: 104/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:35:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 1875[0m
     | > loss: 0.44085  (0.44355)
     | > log_mle: -0.20446  (-0.21004)
     | > loss_dur: 0.64531  (0.65359)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.05136  (1.26577)
     | > current_lr: 0.00003 
     | > step_time: 0.68460  (0.63024)
     | > loader_time: 0.60350  (0.45007)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00701)
     | > avg_loss:[92m 0.43375 [0m(-0.01222)
     | > avg_log_mle:[92m -0.24111 [0m(-0.00588)
     | > avg_loss_dur:[92m 0.67486 [0m(-0.00634)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1890.pth

[4m[1m > EPOCH: 105/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:36:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 1900[0m
     | > loss: 0.50874  (0.47000)
     | > log_mle: -0.20349  (-0.20745)
     | > loss_dur: 0.71223  (0.67745)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 0.99732  (1.30295)
     | > current_lr: 0.00003 
     | > step_time: 0.69660  (0.68542)
     | > loader_time: 0.43840  (0.42288)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00000)
     | > avg_loss:[92m 0.42977 [0m(-0.00398)
     | > avg_log_mle:[92m -0.24224 [0m(-0.00113)
     | > avg_loss_dur:[92m 0.67200 [0m(-0.00286)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1908.pth

[4m[1m > EPOCH: 106/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:36:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 1925[0m
     | > loss: 0.57656  (0.48993)
     | > log_mle: -0.20846  (-0.20957)
     | > loss_dur: 0.78503  (0.69950)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.21584  (1.31008)
     | > current_lr: 0.00003 
     | > step_time: 0.83980  (0.75981)
     | > loader_time: 0.42240  (0.48856)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.43336 [0m(+0.00360)
     | > avg_log_mle:[92m -0.24478 [0m(-0.00254)
     | > avg_loss_dur:[91m 0.67814 [0m(+0.00614)


[4m[1m > EPOCH: 107/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:37:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00501)
     | > avg_loss:[92m 0.41795 [0m(-0.01541)
     | > avg_log_mle:[92m -0.24916 [0m(-0.00438)
     | > avg_loss_dur:[92m 0.66711 [0m(-0.01103)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_1944.pth

[4m[1m > EPOCH: 108/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:37:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 1950[0m
     | > loss: 0.48164  (0.44643)
     | > log_mle: -0.19944  (-0.21470)
     | > loss_dur: 0.68108  (0.66113)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.31703  (1.54149)
     | > current_lr: 0.00003 
     | > step_time: 0.63760  (0.66444)
     | > loader_time: 0.37530  (0.40520)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[91m 0.42289 [0m(+0.00494)
     | > avg_log_mle:[92m -0.24959 [0m(-0.00043)
     | > avg_loss_dur:[91m 0.67247 [0m(+0.00536)


[4m[1m > EPOCH: 109/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:38:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 1975[0m
     | > loss: 0.52616  (0.46959)
     | > log_mle: -0.21424  (-0.21961)
     | > loss_dur: 0.74040  (0.68921)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.23225  (1.53901)
     | > current_lr: 0.00003 
     | > step_time: 0.77770  (0.71280)
     | > loader_time: 0.51750  (0.45672)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00100)
     | > avg_loss:[92m 0.42010 [0m(-0.00279)
     | > avg_log_mle:[92m -0.25445 [0m(-0.00486)
     | > avg_loss_dur:[91m 0.67455 [0m(+0.00208)


[4m[1m > EPOCH: 110/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:38:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01001)
     | > avg_loss:[91m 0.42102 [0m(+0.00092)
     | > avg_log_mle:[92m -0.25777 [0m(-0.00332)
     | > avg_loss_dur:[91m 0.67879 [0m(+0.00424)


[4m[1m > EPOCH: 111/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:39:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 2000[0m
     | > loss: 0.43193  (0.42902)
     | > log_mle: -0.24054  (-0.23306)
     | > loss_dur: 0.67247  (0.66208)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 1.45000  (1.56930)
     | > current_lr: 0.00003 
     | > step_time: 0.55650  (0.60205)
     | > loader_time: 0.33130  (0.36984)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00801)
     | > avg_loss:[92m 0.41180 [0m(-0.00922)
     | > avg_log_mle:[92m -0.25903 [0m(-0.00126)
     | > avg_loss_dur:[92m 0.67083 [0m(-0.00796)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2016.pth

[4m[1m > EPOCH: 112/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:39:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 2025[0m
     | > loss: 0.46082  (0.44157)
     | > log_mle: -0.23225  (-0.22853)
     | > loss_dur: 0.69307  (0.67010)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.18335  (1.80630)
     | > current_lr: 0.00003 
     | > step_time: 0.86680  (0.68440)
     | > loader_time: 0.54350  (0.42283)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00901)
     | > avg_loss:[91m 0.41786 [0m(+0.00606)
     | > avg_log_mle:[92m -0.25908 [0m(-0.00005)
     | > avg_loss_dur:[91m 0.67694 [0m(+0.00611)


[4m[1m > EPOCH: 113/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:40:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 2050[0m
     | > loss: 0.48932  (0.46217)
     | > log_mle: -0.22636  (-0.23022)
     | > loss_dur: 0.71569  (0.69239)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.66536  (1.63105)
     | > current_lr: 0.00003 
     | > step_time: 0.94490  (0.75663)
     | > loader_time: 0.59550  (0.49076)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[91m 0.41964 [0m(+0.00178)
     | > avg_log_mle:[92m -0.26370 [0m(-0.00463)
     | > avg_loss_dur:[91m 0.68335 [0m(+0.00641)


[4m[1m > EPOCH: 114/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:40:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00701)
     | > avg_loss:[92m 0.41709 [0m(-0.00255)
     | > avg_log_mle:[91m -0.26353 [0m(+0.00017)
     | > avg_loss_dur:[92m 0.68062 [0m(-0.00273)


[4m[1m > EPOCH: 115/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:41:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 2075[0m
     | > loss: 0.44903  (0.42168)
     | > log_mle: -0.22588  (-0.23743)
     | > loss_dur: 0.67490  (0.65911)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.60928  (1.64691)
     | > current_lr: 0.00003 
     | > step_time: 0.73970  (0.67081)
     | > loader_time: 0.45240  (0.42178)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00200)
     | > avg_loss:[92m 0.41330 [0m(-0.00379)
     | > avg_log_mle:[92m -0.26933 [0m(-0.00580)
     | > avg_loss_dur:[91m 0.68263 [0m(+0.00201)


[4m[1m > EPOCH: 116/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:41:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 2100[0m
     | > loss: 0.47387  (0.44067)
     | > log_mle: -0.24083  (-0.23917)
     | > loss_dur: 0.71470  (0.67984)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.93342  (1.61529)
     | > current_lr: 0.00003 
     | > step_time: 0.90080  (0.70639)
     | > loader_time: 0.63060  (0.45775)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00901)
     | > avg_loss:[92m 0.39663 [0m(-0.01667)
     | > avg_log_mle:[92m -0.27264 [0m(-0.00331)
     | > avg_loss_dur:[92m 0.66927 [0m(-0.01336)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2106.pth

[4m[1m > EPOCH: 117/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:42:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[92m 0.39518 [0m(-0.00144)
     | > avg_log_mle:[92m -0.27428 [0m(-0.00164)
     | > avg_loss_dur:[91m 0.66946 [0m(+0.00019)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2124.pth

[4m[1m > EPOCH: 118/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:42:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 2125[0m
     | > loss: 0.40976  (0.40976)
     | > log_mle: -0.24416  (-0.24416)
     | > loss_dur: 0.65392  (0.65392)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.47251  (1.47251)
     | > current_lr: 0.00003 
     | > step_time: 0.64860  (0.64859)
     | > loader_time: 0.53450  (0.53449)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00400)
     | > avg_loss:[91m 0.39788 [0m(+0.00270)
     | > avg_log_mle:[91m -0.27374 [0m(+0.00054)
     | > avg_loss_dur:[91m 0.67162 [0m(+0.00216)


[4m[1m > EPOCH: 119/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:43:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 2150[0m
     | > loss: 0.42784  (0.41052)
     | > log_mle: -0.25148  (-0.24569)
     | > loss_dur: 0.67931  (0.65621)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.00109  (1.87172)
     | > current_lr: 0.00003 
     | > step_time: 0.67260  (0.65948)
     | > loader_time: 0.39940  (0.40074)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[92m 0.39786 [0m(-0.00002)
     | > avg_log_mle:[92m -0.27685 [0m(-0.00312)
     | > avg_loss_dur:[91m 0.67471 [0m(+0.00309)


[4m[1m > EPOCH: 120/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:43:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 2175[0m
     | > loss: 0.44381  (0.43138)
     | > log_mle: -0.24854  (-0.24744)
     | > loss_dur: 0.69234  (0.67882)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.27345  (1.91173)
     | > current_lr: 0.00003 
     | > step_time: 0.87080  (0.74709)
     | > loader_time: 0.52850  (0.46208)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.00300)
     | > avg_loss:[91m 0.41021 [0m(+0.01235)
     | > avg_log_mle:[92m -0.27695 [0m(-0.00009)
     | > avg_loss_dur:[91m 0.68716 [0m(+0.01244)


[4m[1m > EPOCH: 121/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:44:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01802)
     | > avg_loss:[92m 0.39680 [0m(-0.01341)
     | > avg_log_mle:[92m -0.28114 [0m(-0.00419)
     | > avg_loss_dur:[92m 0.67794 [0m(-0.00922)


[4m[1m > EPOCH: 122/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:44:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 2200[0m
     | > loss: 0.38536  (0.37709)
     | > log_mle: -0.25493  (-0.25839)
     | > loss_dur: 0.64029  (0.63547)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.09991  (1.64208)
     | > current_lr: 0.00003 
     | > step_time: 0.72570  (0.65335)
     | > loader_time: 0.48740  (0.40762)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01301)
     | > avg_loss:[92m 0.39094 [0m(-0.00586)
     | > avg_log_mle:[92m -0.28353 [0m(-0.00239)
     | > avg_loss_dur:[92m 0.67448 [0m(-0.00346)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2214.pth

[4m[1m > EPOCH: 123/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:45:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 2225[0m
     | > loss: 0.43476  (0.39246)
     | > log_mle: -0.25820  (-0.25615)
     | > loss_dur: 0.69296  (0.64861)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.64914  (1.62018)
     | > current_lr: 0.00003 
     | > step_time: 0.72670  (0.68726)
     | > loader_time: 0.43840  (0.42011)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00701)
     | > avg_loss:[92m 0.38283 [0m(-0.00811)
     | > avg_log_mle:[92m -0.28563 [0m(-0.00209)
     | > avg_loss_dur:[92m 0.66846 [0m(-0.00602)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2232.pth

[4m[1m > EPOCH: 124/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:45:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[92m 0.35337 [0m(-0.02946)
     | > avg_log_mle:[92m -0.28856 [0m(-0.00294)
     | > avg_loss_dur:[92m 0.64193 [0m(-0.02653)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2250.pth

[4m[1m > EPOCH: 125/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:46:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 2250[0m
     | > loss: 0.35741  (0.35741)
     | > log_mle: -0.27471  (-0.27471)
     | > loss_dur: 0.63212  (0.63212)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.43068  (1.43068)
     | > current_lr: 0.00003 
     | > step_time: 0.64960  (0.64959)
     | > loader_time: 0.28430  (0.28426)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00500)
     | > avg_loss:[92m 0.34688 [0m(-0.00649)
     | > avg_log_mle:[92m -0.29224 [0m(-0.00368)
     | > avg_loss_dur:[92m 0.63912 [0m(-0.00281)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2268.pth

[4m[1m > EPOCH: 126/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:46:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 2275[0m
     | > loss: 0.34916  (0.35394)
     | > log_mle: -0.26764  (-0.26185)
     | > loss_dur: 0.61680  (0.61579)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.89636  (1.79346)
     | > current_lr: 0.00003 
     | > step_time: 0.64860  (0.66089)
     | > loader_time: 0.38940  (0.40580)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00000)
     | > avg_loss:[91m 0.35003 [0m(+0.00315)
     | > avg_log_mle:[91m -0.29179 [0m(+0.00045)
     | > avg_loss_dur:[91m 0.64182 [0m(+0.00270)


[4m[1m > EPOCH: 127/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:47:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 2300[0m
     | > loss: 0.43175  (0.37364)
     | > log_mle: -0.25518  (-0.26355)
     | > loss_dur: 0.68694  (0.63719)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.75053  (2.01677)
     | > current_lr: 0.00003 
     | > step_time: 1.00790  (0.73160)
     | > loader_time: 0.64060  (0.45320)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07306 [0m(+0.00500)
     | > avg_loss:[92m 0.33155 [0m(-0.01848)
     | > avg_log_mle:[92m -0.29676 [0m(-0.00496)
     | > avg_loss_dur:[92m 0.62831 [0m(-0.01351)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2304.pth

[4m[1m > EPOCH: 128/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:47:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01101)
     | > avg_loss:[92m 0.32598 [0m(-0.00558)
     | > avg_log_mle:[92m -0.29803 [0m(-0.00128)
     | > avg_loss_dur:[92m 0.62401 [0m(-0.00430)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2322.pth

[4m[1m > EPOCH: 129/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:48:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 2325[0m
     | > loss: 0.32563  (0.33422)
     | > log_mle: -0.26961  (-0.27413)
     | > loss_dur: 0.59524  (0.60835)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.69720  (2.10815)
     | > current_lr: 0.00003 
     | > step_time: 0.67860  (0.62724)
     | > loader_time: 0.41140  (0.36500)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06206 [0m(+0.00000)
     | > avg_loss:[91m 0.32635 [0m(+0.00038)
     | > avg_log_mle:[92m -0.29821 [0m(-0.00018)
     | > avg_loss_dur:[91m 0.62456 [0m(+0.00056)


[4m[1m > EPOCH: 130/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:48:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 2350[0m
     | > loss: 0.37517  (0.33871)
     | > log_mle: -0.26302  (-0.27058)
     | > loss_dur: 0.63819  (0.60929)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.96295  (2.01950)
     | > current_lr: 0.00003 
     | > step_time: 0.69160  (0.68232)
     | > loader_time: 0.42840  (0.42559)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.01001)
     | > avg_loss:[92m 0.31752 [0m(-0.00883)
     | > avg_log_mle:[92m -0.30119 [0m(-0.00298)
     | > avg_loss_dur:[92m 0.61871 [0m(-0.00585)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2358.pth

[4m[1m > EPOCH: 131/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:49:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 2375[0m
     | > loss: 0.41275  (0.35383)
     | > log_mle: -0.27039  (-0.27165)
     | > loss_dur: 0.68314  (0.62547)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.35155  (2.07803)
     | > current_lr: 0.00003 
     | > step_time: 0.83980  (0.76191)
     | > loader_time: 0.43040  (0.47508)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00300)
     | > avg_loss:[91m 0.32237 [0m(+0.00484)
     | > avg_log_mle:[92m -0.30288 [0m(-0.00170)
     | > avg_loss_dur:[91m 0.62525 [0m(+0.00654)


[4m[1m > EPOCH: 132/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:49:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[92m 0.31539 [0m(-0.00697)
     | > avg_log_mle:[92m -0.30397 [0m(-0.00109)
     | > avg_loss_dur:[92m 0.61937 [0m(-0.00588)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2394.pth

[4m[1m > EPOCH: 133/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:50:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 2400[0m
     | > loss: 0.32291  (0.32001)
     | > log_mle: -0.25953  (-0.27448)
     | > loss_dur: 0.58244  (0.59449)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.71495  (2.30725)
     | > current_lr: 0.00003 
     | > step_time: 0.64160  (0.66444)
     | > loader_time: 0.37230  (0.40503)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08007 [0m(+0.01201)
     | > avg_loss:[91m 0.33212 [0m(+0.01673)
     | > avg_log_mle:[92m -0.30471 [0m(-0.00073)
     | > avg_loss_dur:[91m 0.63683 [0m(+0.01746)


[4m[1m > EPOCH: 134/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:50:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 2425[0m
     | > loss: 0.36410  (0.32564)
     | > log_mle: -0.27296  (-0.27857)
     | > loss_dur: 0.63706  (0.60421)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.15700  (1.78673)
     | > current_lr: 0.00003 
     | > step_time: 0.77870  (0.71149)
     | > loader_time: 0.50050  (0.45996)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.01101)
     | > avg_loss:[92m 0.31022 [0m(-0.02190)
     | > avg_log_mle:[92m -0.30869 [0m(-0.00399)
     | > avg_loss_dur:[92m 0.61891 [0m(-0.01791)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2430.pth

[4m[1m > EPOCH: 135/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:51:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[92m 0.29829 [0m(-0.01193)
     | > avg_log_mle:[92m -0.31086 [0m(-0.00217)
     | > avg_loss_dur:[92m 0.60916 [0m(-0.00976)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2448.pth

[4m[1m > EPOCH: 136/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:52:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 2450[0m
     | > loss: 0.30516  (0.30083)
     | > log_mle: -0.29596  (-0.28941)
     | > loss_dur: 0.60112  (0.59024)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.37033  (2.35888)
     | > current_lr: 0.00003 
     | > step_time: 0.55350  (0.60105)
     | > loader_time: 0.33430  (0.35231)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00300)
     | > avg_loss:[91m 0.30359 [0m(+0.00529)
     | > avg_log_mle:[92m -0.31146 [0m(-0.00060)
     | > avg_loss_dur:[91m 0.61505 [0m(+0.00589)


[4m[1m > EPOCH: 137/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:52:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 2475[0m
     | > loss: 0.33036  (0.30229)
     | > log_mle: -0.28698  (-0.28521)
     | > loss_dur: 0.61734  (0.58749)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.47865  (2.01557)
     | > current_lr: 0.00003 
     | > step_time: 0.86480  (0.68318)
     | > loader_time: 0.54450  (0.43540)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00400)
     | > avg_loss:[92m 0.29640 [0m(-0.00719)
     | > avg_log_mle:[92m -0.31425 [0m(-0.00279)
     | > avg_loss_dur:[92m 0.61065 [0m(-0.00440)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2484.pth

[4m[1m > EPOCH: 138/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:53:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 2500[0m
     | > loss: 0.36431  (0.32001)
     | > log_mle: -0.27837  (-0.28442)
     | > loss_dur: 0.64268  (0.60443)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.00911  (2.05921)
     | > current_lr: 0.00003 
     | > step_time: 0.95090  (0.76026)
     | > loader_time: 0.55350  (0.47668)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[91m 0.29875 [0m(+0.00235)
     | > avg_log_mle:[92m -0.31624 [0m(-0.00199)
     | > avg_loss_dur:[91m 0.61500 [0m(+0.00435)


[4m[1m > EPOCH: 139/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:53:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[92m 0.29247 [0m(-0.00628)
     | > avg_log_mle:[91m -0.31557 [0m(+0.00068)
     | > avg_loss_dur:[92m 0.60804 [0m(-0.00696)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2520.pth

[4m[1m > EPOCH: 140/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:54:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 2525[0m
     | > loss: 0.29355  (0.28483)
     | > log_mle: -0.28056  (-0.29072)
     | > loss_dur: 0.57410  (0.57555)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 5.01078  (3.06392)
     | > current_lr: 0.00004 
     | > step_time: 0.74070  (0.67121)
     | > loader_time: 0.45640  (0.41778)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00500)
     | > avg_loss:[92m 0.28776 [0m(-0.00471)
     | > avg_log_mle:[92m -0.31624 [0m(-0.00068)
     | > avg_loss_dur:[92m 0.60401 [0m(-0.00403)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2538.pth

[4m[1m > EPOCH: 141/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:54:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 2550[0m
     | > loss: 0.33030  (0.29275)
     | > log_mle: -0.29325  (-0.29198)
     | > loss_dur: 0.62354  (0.58474)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.72865  (2.43292)
     | > current_lr: 0.00004 
     | > step_time: 0.90280  (0.70648)
     | > loader_time: 0.59050  (0.44215)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00801)
     | > avg_loss:[92m 0.28366 [0m(-0.00410)
     | > avg_log_mle:[92m -0.31706 [0m(-0.00082)
     | > avg_loss_dur:[92m 0.60072 [0m(-0.00328)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2556.pth

[4m[1m > EPOCH: 142/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:55:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[91m 0.29667 [0m(+0.01300)
     | > avg_log_mle:[92m -0.31984 [0m(-0.00278)
     | > avg_loss_dur:[91m 0.61651 [0m(+0.01578)


[4m[1m > EPOCH: 143/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:55:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 2575[0m
     | > loss: 0.26792  (0.26792)
     | > log_mle: -0.29602  (-0.29602)
     | > loss_dur: 0.56394  (0.56394)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.32845  (2.32845)
     | > current_lr: 0.00004 
     | > step_time: 0.64560  (0.64559)
     | > loader_time: 0.35530  (0.35532)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[92m 0.29254 [0m(-0.00412)
     | > avg_log_mle:[92m -0.32286 [0m(-0.00302)
     | > avg_loss_dur:[92m 0.61540 [0m(-0.00111)


[4m[1m > EPOCH: 144/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:56:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 2600[0m
     | > loss: 0.27186  (0.26764)
     | > log_mle: -0.30332  (-0.29703)
     | > loss_dur: 0.57518  (0.56467)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.80182  (2.47886)
     | > current_lr: 0.00004 
     | > step_time: 0.67560  (0.66223)
     | > loader_time: 0.44740  (0.41087)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00200)
     | > avg_loss:[92m 0.28013 [0m(-0.01241)
     | > avg_log_mle:[92m -0.32431 [0m(-0.00145)
     | > avg_loss_dur:[92m 0.60444 [0m(-0.01096)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2610.pth

[4m[1m > EPOCH: 145/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:56:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 2625[0m
     | > loss: 0.31030  (0.28998)
     | > log_mle: -0.29597  (-0.29743)
     | > loss_dur: 0.60627  (0.58741)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.02407  (2.66828)
     | > current_lr: 0.00004 
     | > step_time: 0.86780  (0.74354)
     | > loader_time: 0.53550  (0.47897)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00901)
     | > avg_loss:[91m 0.28380 [0m(+0.00368)
     | > avg_log_mle:[91m -0.32412 [0m(+0.00018)
     | > avg_loss_dur:[91m 0.60793 [0m(+0.00349)


[4m[1m > EPOCH: 146/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:57:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06306 [0m(+0.00000)
     | > avg_loss:[91m 0.28486 [0m(+0.00106)
     | > avg_log_mle:[92m -0.32653 [0m(-0.00241)
     | > avg_loss_dur:[91m 0.61139 [0m(+0.00346)


[4m[1m > EPOCH: 147/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:57:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 2650[0m
     | > loss: 0.26863  (0.26001)
     | > log_mle: -0.30278  (-0.30554)
     | > loss_dur: 0.57141  (0.56555)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.95636  (2.14669)
     | > current_lr: 0.00004 
     | > step_time: 0.72570  (0.65059)
     | > loader_time: 0.49850  (0.41438)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00601)
     | > avg_loss:[92m 0.25003 [0m(-0.03483)
     | > avg_log_mle:[92m -0.32851 [0m(-0.00198)
     | > avg_loss_dur:[92m 0.57854 [0m(-0.03285)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2664.pth

[4m[1m > EPOCH: 148/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:58:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 2675[0m
     | > loss: 0.28731  (0.26794)
     | > log_mle: -0.30462  (-0.30293)
     | > loss_dur: 0.59193  (0.57087)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.75134  (2.64120)
     | > current_lr: 0.00004 
     | > step_time: 0.73670  (0.69172)
     | > loader_time: 0.48740  (0.43685)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00300)
     | > avg_loss:[91m 0.27048 [0m(+0.02045)
     | > avg_log_mle:[91m -0.32649 [0m(+0.00202)
     | > avg_loss_dur:[91m 0.59697 [0m(+0.01843)


[4m[1m > EPOCH: 149/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:58:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01201)
     | > avg_loss:[92m 0.26610 [0m(-0.00438)
     | > avg_log_mle:[92m -0.33162 [0m(-0.00513)
     | > avg_loss_dur:[91m 0.59772 [0m(+0.00075)


[4m[1m > EPOCH: 150/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:59:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 2700[0m
     | > loss: 0.24867  (0.24867)
     | > log_mle: -0.32058  (-0.32058)
     | > loss_dur: 0.56924  (0.56924)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.56420  (3.56420)
     | > current_lr: 0.00004 
     | > step_time: 0.49350  (0.49345)
     | > loader_time: 0.27630  (0.27625)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00901)
     | > avg_loss:[91m 0.26869 [0m(+0.00259)
     | > avg_log_mle:[91m -0.33146 [0m(+0.00016)
     | > avg_loss_dur:[91m 0.60015 [0m(+0.00242)


[4m[1m > EPOCH: 151/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 05:59:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 2725[0m
     | > loss: 0.25488  (0.24756)
     | > log_mle: -0.31124  (-0.30672)
     | > loss_dur: 0.56612  (0.55428)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.61242  (2.70631)
     | > current_lr: 0.00004 
     | > step_time: 0.64260  (0.65960)
     | > loader_time: 0.41940  (0.40980)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[91m 0.27127 [0m(+0.00258)
     | > avg_log_mle:[92m -0.33356 [0m(-0.00210)
     | > avg_loss_dur:[91m 0.60483 [0m(+0.00469)


[4m[1m > EPOCH: 152/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:00:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 2750[0m
     | > loss: 0.32760  (0.26546)
     | > log_mle: -0.29811  (-0.30826)
     | > loss_dur: 0.62571  (0.57372)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.50617  (2.65382)
     | > current_lr: 0.00004 
     | > step_time: 1.01390  (0.73488)
     | > loader_time: 0.60250  (0.48494)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[92m 0.26095 [0m(-0.01032)
     | > avg_log_mle:[91m -0.33266 [0m(+0.00091)
     | > avg_loss_dur:[92m 0.59361 [0m(-0.01123)


[4m[1m > EPOCH: 153/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:00:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00601)
     | > avg_loss:[91m 0.26606 [0m(+0.00511)
     | > avg_log_mle:[92m -0.33873 [0m(-0.00608)
     | > avg_loss_dur:[91m 0.60479 [0m(+0.01118)


[4m[1m > EPOCH: 154/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:01:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 2775[0m
     | > loss: 0.23417  (0.23855)
     | > log_mle: -0.31329  (-0.31556)
     | > loss_dur: 0.54747  (0.55411)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.89947  (5.34545)
     | > current_lr: 0.00004 
     | > step_time: 0.68360  (0.63224)
     | > loader_time: 0.42640  (0.37601)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06306 [0m(+0.00100)
     | > avg_loss:[92m 0.25232 [0m(-0.01374)
     | > avg_log_mle:[92m -0.34051 [0m(-0.00178)
     | > avg_loss_dur:[92m 0.59283 [0m(-0.01196)


[4m[1m > EPOCH: 155/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:01:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 2800[0m
     | > loss: 0.28153  (0.24275)
     | > log_mle: -0.30364  (-0.31393)
     | > loss_dur: 0.58517  (0.55668)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.80910  (2.48374)
     | > current_lr: 0.00004 
     | > step_time: 0.69860  (0.68533)
     | > loader_time: 0.45940  (0.43950)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00701)
     | > avg_loss:[91m 0.25541 [0m(+0.00309)
     | > avg_log_mle:[92m -0.34221 [0m(-0.00170)
     | > avg_loss_dur:[91m 0.59762 [0m(+0.00479)


[4m[1m > EPOCH: 156/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:02:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 2825[0m
     | > loss: 0.30841  (0.26010)
     | > log_mle: -0.31260  (-0.31319)
     | > loss_dur: 0.62101  (0.57329)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.23244  (3.13565)
     | > current_lr: 0.00004 
     | > step_time: 0.83880  (0.76337)
     | > loader_time: 0.45140  (0.48114)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00700)
     | > avg_loss:[91m 0.25644 [0m(+0.00103)
     | > avg_log_mle:[92m -0.34231 [0m(-0.00010)
     | > avg_loss_dur:[91m 0.59875 [0m(+0.00113)


[4m[1m > EPOCH: 157/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:02:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00100)
     | > avg_loss:[92m 0.24874 [0m(-0.00769)
     | > avg_log_mle:[92m -0.34330 [0m(-0.00099)
     | > avg_loss_dur:[92m 0.59204 [0m(-0.00671)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2844.pth

[4m[1m > EPOCH: 158/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:03:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 2850[0m
     | > loss: 0.23913  (0.22405)
     | > log_mle: -0.30319  (-0.31739)
     | > loss_dur: 0.54232  (0.54143)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.28450  (1.92037)
     | > current_lr: 0.00004 
     | > step_time: 0.63660  (0.66377)
     | > loader_time: 0.40040  (0.39419)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.01301)
     | > avg_loss:[91m 0.25877 [0m(+0.01002)
     | > avg_log_mle:[91m -0.34309 [0m(+0.00021)
     | > avg_loss_dur:[91m 0.60186 [0m(+0.00981)


[4m[1m > EPOCH: 159/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:03:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 2875[0m
     | > loss: 0.28006  (0.23952)
     | > log_mle: -0.31447  (-0.31983)
     | > loss_dur: 0.59453  (0.55935)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.74788  (1.98530)
     | > current_lr: 0.00004 
     | > step_time: 0.77370  (0.71250)
     | > loader_time: 0.49540  (0.47543)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00200)
     | > avg_loss:[91m 0.27500 [0m(+0.01624)
     | > avg_log_mle:[92m -0.34420 [0m(-0.00111)
     | > avg_loss_dur:[91m 0.61920 [0m(+0.01735)


[4m[1m > EPOCH: 160/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:04:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00100)
     | > avg_loss:[92m 0.26250 [0m(-0.01251)
     | > avg_log_mle:[91m -0.34240 [0m(+0.00180)
     | > avg_loss_dur:[92m 0.60490 [0m(-0.01431)


[4m[1m > EPOCH: 161/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:04:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 2900[0m
     | > loss: 0.22078  (0.21178)
     | > log_mle: -0.33344  (-0.32806)
     | > loss_dur: 0.55422  (0.53984)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.17693  (2.22184)
     | > current_lr: 0.00004 
     | > step_time: 0.55650  (0.60055)
     | > loader_time: 0.33530  (0.33981)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[92m 0.25115 [0m(-0.01134)
     | > avg_log_mle:[92m -0.34696 [0m(-0.00456)
     | > avg_loss_dur:[92m 0.59811 [0m(-0.00679)


[4m[1m > EPOCH: 162/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:05:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 2925[0m
     | > loss: 0.23547  (0.21831)
     | > log_mle: -0.32786  (-0.32438)
     | > loss_dur: 0.56333  (0.54269)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.79199  (3.00955)
     | > current_lr: 0.00004 
     | > step_time: 0.86680  (0.68507)
     | > loader_time: 0.61060  (0.42772)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00400)
     | > avg_loss:[91m 0.25579 [0m(+0.00463)
     | > avg_log_mle:[92m -0.34905 [0m(-0.00209)
     | > avg_loss_dur:[91m 0.60484 [0m(+0.00673)


[4m[1m > EPOCH: 163/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:05:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 2950[0m
     | > loss: 0.29309  (0.23876)
     | > log_mle: -0.31345  (-0.32226)
     | > loss_dur: 0.60654  (0.56103)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 1.99502  (2.93095)
     | > current_lr: 0.00004 
     | > step_time: 0.94090  (0.75378)
     | > loader_time: 0.55650  (0.48650)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00300)
     | > avg_loss:[91m 0.25901 [0m(+0.00323)
     | > avg_log_mle:[92m -0.34938 [0m(-0.00033)
     | > avg_loss_dur:[91m 0.60840 [0m(+0.00356)


[4m[1m > EPOCH: 164/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:06:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00300)
     | > avg_loss:[92m 0.23204 [0m(-0.02698)
     | > avg_log_mle:[92m -0.35102 [0m(-0.00163)
     | > avg_loss_dur:[92m 0.58305 [0m(-0.02534)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_2970.pth

[4m[1m > EPOCH: 165/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:07:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 2975[0m
     | > loss: 0.19698  (0.20172)
     | > log_mle: -0.32147  (-0.32924)
     | > loss_dur: 0.51845  (0.53096)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.26429  (2.17997)
     | > current_lr: 0.00004 
     | > step_time: 0.73470  (0.66961)
     | > loader_time: 0.41340  (0.40677)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00801)
     | > avg_loss:[91m 0.24329 [0m(+0.01125)
     | > avg_log_mle:[92m -0.35152 [0m(-0.00050)
     | > avg_loss_dur:[91m 0.59481 [0m(+0.01175)


[4m[1m > EPOCH: 166/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:07:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 3000[0m
     | > loss: 0.23588  (0.21556)
     | > log_mle: -0.32914  (-0.32890)
     | > loss_dur: 0.56502  (0.54446)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.90609  (4.10109)
     | > current_lr: 0.00004 
     | > step_time: 0.90780  (0.71015)
     | > loader_time: 0.62660  (0.44415)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00801)
     | > avg_loss:[91m 0.26638 [0m(+0.02309)
     | > avg_log_mle:[91m -0.34727 [0m(+0.00425)
     | > avg_loss_dur:[91m 0.61365 [0m(+0.01884)


[4m[1m > EPOCH: 167/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:08:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07007 [0m(+0.00401)
     | > avg_loss:[91m 0.27155 [0m(+0.00517)
     | > avg_log_mle:[92m -0.35182 [0m(-0.00455)
     | > avg_loss_dur:[91m 0.62337 [0m(+0.00972)


[4m[1m > EPOCH: 168/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:08:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 3025[0m
     | > loss: 0.19595  (0.19595)
     | > log_mle: -0.33295  (-0.33295)
     | > loss_dur: 0.52890  (0.52890)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.33052  (3.33052)
     | > current_lr: 0.00004 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.37830  (0.37834)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[92m 0.24181 [0m(-0.02973)
     | > avg_log_mle:[92m -0.35258 [0m(-0.00077)
     | > avg_loss_dur:[92m 0.59440 [0m(-0.02897)


[4m[1m > EPOCH: 169/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:09:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 3050[0m
     | > loss: 0.20584  (0.19184)
     | > log_mle: -0.33960  (-0.33286)
     | > loss_dur: 0.54544  (0.52469)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.51336  (3.04254)
     | > current_lr: 0.00004 
     | > step_time: 0.67960  (0.66335)
     | > loader_time: 0.41040  (0.41337)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[91m 0.27217 [0m(+0.03035)
     | > avg_log_mle:[91m -0.35161 [0m(+0.00097)
     | > avg_loss_dur:[91m 0.62378 [0m(+0.02938)


[4m[1m > EPOCH: 170/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:09:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 3075[0m
     | > loss: 0.24313  (0.21033)
     | > log_mle: -0.32998  (-0.33289)
     | > loss_dur: 0.57311  (0.54321)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.46440  (3.05633)
     | > current_lr: 0.00004 
     | > step_time: 0.86580  (0.74154)
     | > loader_time: 0.54950  (0.48197)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[92m 0.25660 [0m(-0.01557)
     | > avg_log_mle:[92m -0.35509 [0m(-0.00348)
     | > avg_loss_dur:[92m 0.61169 [0m(-0.01209)


[4m[1m > EPOCH: 171/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:10:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[92m 0.23334 [0m(-0.02326)
     | > avg_log_mle:[91m -0.35228 [0m(+0.00281)
     | > avg_loss_dur:[92m 0.58561 [0m(-0.02608)


[4m[1m > EPOCH: 172/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:10:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 3100[0m
     | > loss: 0.18367  (0.18452)
     | > log_mle: -0.33536  (-0.33790)
     | > loss_dur: 0.51903  (0.52242)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.34833  (4.38302)
     | > current_lr: 0.00004 
     | > step_time: 0.72370  (0.65109)
     | > loader_time: 0.45140  (0.39361)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00100)
     | > avg_loss:[91m 0.23490 [0m(+0.00156)
     | > avg_log_mle:[92m -0.36197 [0m(-0.00970)
     | > avg_loss_dur:[91m 0.59687 [0m(+0.01126)


[4m[1m > EPOCH: 173/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:11:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 3125[0m
     | > loss: 0.21561  (0.19266)
     | > log_mle: -0.33827  (-0.33673)
     | > loss_dur: 0.55388  (0.52939)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.81664  (2.90025)
     | > current_lr: 0.00004 
     | > step_time: 0.73270  (0.69055)
     | > loader_time: 0.49340  (0.44212)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00601)
     | > avg_loss:[92m 0.22492 [0m(-0.00998)
     | > avg_log_mle:[91m -0.35936 [0m(+0.00262)
     | > avg_loss_dur:[92m 0.58428 [0m(-0.01259)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_3132.pth

[4m[1m > EPOCH: 174/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:11:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00400)
     | > avg_loss:[91m 0.23542 [0m(+0.01050)
     | > avg_log_mle:[92m -0.36178 [0m(-0.00242)
     | > avg_loss_dur:[91m 0.59720 [0m(+0.01292)


[4m[1m > EPOCH: 175/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:12:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 3150[0m
     | > loss: 0.15769  (0.15769)
     | > log_mle: -0.35489  (-0.35489)
     | > loss_dur: 0.51257  (0.51257)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.63340  (3.63340)
     | > current_lr: 0.00004 
     | > step_time: 0.61860  (0.61856)
     | > loader_time: 0.27410  (0.27411)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00400)
     | > avg_loss:[91m 0.23627 [0m(+0.00085)
     | > avg_log_mle:[91m -0.36071 [0m(+0.00108)
     | > avg_loss_dur:[92m 0.59697 [0m(-0.00022)


[4m[1m > EPOCH: 176/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:12:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 3175[0m
     | > loss: 0.18340  (0.17645)
     | > log_mle: -0.34546  (-0.33959)
     | > loss_dur: 0.52886  (0.51603)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.14900  (4.65946)
     | > current_lr: 0.00004 
     | > step_time: 0.64360  (0.66518)
     | > loader_time: 0.42140  (0.40966)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00100)
     | > avg_loss:[92m 0.23395 [0m(-0.00232)
     | > avg_log_mle:[92m -0.36311 [0m(-0.00241)
     | > avg_loss_dur:[91m 0.59706 [0m(+0.00009)


[4m[1m > EPOCH: 177/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:13:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 3200[0m
     | > loss: 0.25462  (0.19012)
     | > log_mle: -0.32962  (-0.34138)
     | > loss_dur: 0.58424  (0.53151)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.38487  (3.18741)
     | > current_lr: 0.00004 
     | > step_time: 1.00490  (0.73488)
     | > loader_time: 0.61260  (0.46578)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00300)
     | > avg_loss:[91m 0.24291 [0m(+0.00896)
     | > avg_log_mle:[92m -0.36437 [0m(-0.00126)
     | > avg_loss_dur:[91m 0.60728 [0m(+0.01022)


[4m[1m > EPOCH: 178/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:13:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00501)
     | > avg_loss:[92m 0.23919 [0m(-0.00372)
     | > avg_log_mle:[92m -0.36472 [0m(-0.00035)
     | > avg_loss_dur:[92m 0.60391 [0m(-0.00337)


[4m[1m > EPOCH: 179/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:14:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 3225[0m
     | > loss: 0.16686  (0.16426)
     | > log_mle: -0.34648  (-0.34893)
     | > loss_dur: 0.51334  (0.51319)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.92998  (3.02767)
     | > current_lr: 0.00004 
     | > step_time: 0.67360  (0.62457)
     | > loader_time: 0.40540  (0.37134)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00501)
     | > avg_loss:[91m 0.24481 [0m(+0.00562)
     | > avg_log_mle:[92m -0.36493 [0m(-0.00021)
     | > avg_loss_dur:[91m 0.60974 [0m(+0.00583)


[4m[1m > EPOCH: 180/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:14:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 3250[0m
     | > loss: 0.21778  (0.17279)
     | > log_mle: -0.33338  (-0.34515)
     | > loss_dur: 0.55116  (0.51794)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.51870  (3.33484)
     | > current_lr: 0.00005 
     | > step_time: 0.69460  (0.68833)
     | > loader_time: 0.45240  (0.43159)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[92m 0.24151 [0m(-0.00330)
     | > avg_log_mle:[92m -0.36669 [0m(-0.00176)
     | > avg_loss_dur:[92m 0.60820 [0m(-0.00154)


[4m[1m > EPOCH: 181/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:15:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 3275[0m
     | > loss: 0.23543  (0.18957)
     | > log_mle: -0.34386  (-0.34423)
     | > loss_dur: 0.57929  (0.53380)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.31952  (3.54153)
     | > current_lr: 0.00005 
     | > step_time: 0.83680  (0.76075)
     | > loader_time: 0.43840  (0.50499)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00000)
     | > avg_loss:[92m 0.23481 [0m(-0.00670)
     | > avg_log_mle:[92m -0.36856 [0m(-0.00187)
     | > avg_loss_dur:[92m 0.60337 [0m(-0.00483)


[4m[1m > EPOCH: 182/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:15:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00500)
     | > avg_loss:[92m 0.21282 [0m(-0.02199)
     | > avg_log_mle:[92m -0.36973 [0m(-0.00117)
     | > avg_loss_dur:[92m 0.58255 [0m(-0.02082)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_3294.pth

[4m[1m > EPOCH: 183/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:16:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 3300[0m
     | > loss: 0.16205  (0.15291)
     | > log_mle: -0.33314  (-0.34581)
     | > loss_dur: 0.49519  (0.49871)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 7.56654  (4.56109)
     | > current_lr: 0.00005 
     | > step_time: 0.63760  (0.66227)
     | > loader_time: 0.38740  (0.44173)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00700)
     | > avg_loss:[91m 0.26894 [0m(+0.05612)
     | > avg_log_mle:[91m -0.36885 [0m(+0.00088)
     | > avg_loss_dur:[91m 0.63779 [0m(+0.05524)


[4m[1m > EPOCH: 184/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:16:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 3325[0m
     | > loss: 0.21232  (0.16824)
     | > log_mle: -0.34357  (-0.34879)
     | > loss_dur: 0.55590  (0.51703)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.03051  (4.06580)
     | > current_lr: 0.00005 
     | > step_time: 0.77970  (0.71365)
     | > loader_time: 0.47040  (0.45464)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01001)
     | > avg_loss:[92m 0.25136 [0m(-0.01758)
     | > avg_log_mle:[92m -0.37244 [0m(-0.00359)
     | > avg_loss_dur:[92m 0.62381 [0m(-0.01399)


[4m[1m > EPOCH: 185/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:17:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06705 [0m(+0.00499)
     | > avg_loss:[91m 0.25563 [0m(+0.00427)
     | > avg_log_mle:[91m -0.37123 [0m(+0.00121)
     | > avg_loss_dur:[91m 0.62686 [0m(+0.00306)


[4m[1m > EPOCH: 186/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:17:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 3350[0m
     | > loss: 0.14757  (0.14416)
     | > log_mle: -0.36090  (-0.35561)
     | > loss_dur: 0.50847  (0.49977)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.19556  (4.56157)
     | > current_lr: 0.00005 
     | > step_time: 0.55350  (0.60005)
     | > loader_time: 0.34730  (0.35782)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00602)
     | > avg_loss:[92m 0.23076 [0m(-0.02487)
     | > avg_log_mle:[92m -0.37235 [0m(-0.00112)
     | > avg_loss_dur:[92m 0.60311 [0m(-0.02375)


[4m[1m > EPOCH: 187/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:18:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 3375[0m
     | > loss: 0.15914  (0.14450)
     | > log_mle: -0.35636  (-0.35328)
     | > loss_dur: 0.51550  (0.49778)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.36908  (4.61395)
     | > current_lr: 0.00005 
     | > step_time: 0.87080  (0.68652)
     | > loader_time: 0.57750  (0.42850)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06505 [0m(-0.00802)
     | > avg_loss:[91m 0.24294 [0m(+0.01217)
     | > avg_log_mle:[92m -0.37499 [0m(-0.00264)
     | > avg_loss_dur:[91m 0.61792 [0m(+0.01481)


[4m[1m > EPOCH: 188/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:18:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 3400[0m
     | > loss: 0.24199  (0.16707)
     | > log_mle: -0.34151  (-0.35209)
     | > loss_dur: 0.58350  (0.51916)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.39274  (3.07161)
     | > current_lr: 0.00005 
     | > step_time: 0.94690  (0.75745)
     | > loader_time: 0.59050  (0.47042)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00099)
     | > avg_loss:[92m 0.24214 [0m(-0.00080)
     | > avg_log_mle:[91m -0.37380 [0m(+0.00118)
     | > avg_loss_dur:[92m 0.61594 [0m(-0.00198)


[4m[1m > EPOCH: 189/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:19:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00200)
     | > avg_loss:[91m 0.24325 [0m(+0.00112)
     | > avg_log_mle:[92m -0.37549 [0m(-0.00169)
     | > avg_loss_dur:[91m 0.61875 [0m(+0.00281)


[4m[1m > EPOCH: 190/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:19:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 3425[0m
     | > loss: 0.12947  (0.13072)
     | > log_mle: -0.35060  (-0.35734)
     | > loss_dur: 0.48007  (0.48805)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.21073  (3.82420)
     | > current_lr: 0.00005 
     | > step_time: 0.73370  (0.66621)
     | > loader_time: 0.45240  (0.40496)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06605 [0m(+0.00399)
     | > avg_loss:[92m 0.22473 [0m(-0.01852)
     | > avg_log_mle:[92m -0.37735 [0m(-0.00185)
     | > avg_loss_dur:[92m 0.60208 [0m(-0.01667)


[4m[1m > EPOCH: 191/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:20:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 3450[0m
     | > loss: 0.17020  (0.14174)
     | > log_mle: -0.35618  (-0.35663)
     | > loss_dur: 0.52639  (0.49838)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 6.21440  (3.29428)
     | > current_lr: 0.00005 
     | > step_time: 0.92080  (0.70915)
     | > loader_time: 0.62260  (0.44532)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00402)
     | > avg_loss:[91m 0.25015 [0m(+0.02541)
     | > avg_log_mle:[91m -0.37688 [0m(+0.00047)
     | > avg_loss_dur:[91m 0.62702 [0m(+0.02494)


[4m[1m > EPOCH: 192/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:21:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[92m 0.21768 [0m(-0.03247)
     | > avg_log_mle:[91m -0.37386 [0m(+0.00302)
     | > avg_loss_dur:[92m 0.59154 [0m(-0.03548)


[4m[1m > EPOCH: 193/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:21:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 3475[0m
     | > loss: 0.10880  (0.10880)
     | > log_mle: -0.36037  (-0.36037)
     | > loss_dur: 0.46917  (0.46917)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.21020  (4.21020)
     | > current_lr: 0.00005 
     | > step_time: 0.64560  (0.64559)
     | > loader_time: 0.37730  (0.37734)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00901)
     | > avg_loss:[91m 0.23611 [0m(+0.01843)
     | > avg_log_mle:[92m -0.37838 [0m(-0.00452)
     | > avg_loss_dur:[91m 0.61449 [0m(+0.02295)


[4m[1m > EPOCH: 194/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:22:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 3500[0m
     | > loss: 0.13189  (0.11645)
     | > log_mle: -0.36891  (-0.36197)
     | > loss_dur: 0.50079  (0.47842)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.58823  (2.60137)
     | > current_lr: 0.00005 
     | > step_time: 0.67760  (0.66173)
     | > loader_time: 0.38840  (0.44691)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00300)
     | > avg_loss:[92m 0.23464 [0m(-0.00147)
     | > avg_log_mle:[91m -0.37751 [0m(+0.00086)
     | > avg_loss_dur:[92m 0.61215 [0m(-0.00233)


[4m[1m > EPOCH: 195/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:22:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 3525[0m
     | > loss: 0.17619  (0.13857)
     | > log_mle: -0.35521  (-0.35911)
     | > loss_dur: 0.53140  (0.49768)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 5.03401  (4.38659)
     | > current_lr: 0.00005 
     | > step_time: 0.87480  (0.74621)
     | > loader_time: 0.55850  (0.47276)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00500)
     | > avg_loss:[91m 0.24251 [0m(+0.00787)
     | > avg_log_mle:[91m -0.37591 [0m(+0.00160)
     | > avg_loss_dur:[91m 0.61842 [0m(+0.00627)


[4m[1m > EPOCH: 196/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:23:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[91m 0.25824 [0m(+0.01573)
     | > avg_log_mle:[92m -0.38055 [0m(-0.00463)
     | > avg_loss_dur:[91m 0.63879 [0m(+0.02036)


[4m[1m > EPOCH: 197/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:23:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 3550[0m
     | > loss: 0.12109  (0.10459)
     | > log_mle: -0.36335  (-0.36554)
     | > loss_dur: 0.48444  (0.47012)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.47703  (6.60450)
     | > current_lr: 0.00005 
     | > step_time: 0.71970  (0.65259)
     | > loader_time: 0.47340  (0.39761)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00400)
     | > avg_loss:[92m 0.24557 [0m(-0.01267)
     | > avg_log_mle:[92m -0.38219 [0m(-0.00164)
     | > avg_loss_dur:[92m 0.62776 [0m(-0.01103)


[4m[1m > EPOCH: 198/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:24:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 3575[0m
     | > loss: 0.14686  (0.12003)
     | > log_mle: -0.36507  (-0.36434)
     | > loss_dur: 0.51193  (0.48437)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.49222  (4.46385)
     | > current_lr: 0.00005 
     | > step_time: 0.73270  (0.69127)
     | > loader_time: 0.47840  (0.44713)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[91m 0.25591 [0m(+0.01034)
     | > avg_log_mle:[91m -0.38018 [0m(+0.00201)
     | > avg_loss_dur:[91m 0.63609 [0m(+0.00833)


[4m[1m > EPOCH: 199/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:24:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00601)
     | > avg_loss:[91m 0.25944 [0m(+0.00353)
     | > avg_log_mle:[91m -0.37780 [0m(+0.00238)
     | > avg_loss_dur:[91m 0.63724 [0m(+0.00115)


[4m[1m > EPOCH: 200/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:25:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 3600[0m
     | > loss: 0.04059  (0.04059)
     | > log_mle: -0.37522  (-0.37522)
     | > loss_dur: 0.41581  (0.41581)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.65920  (4.65920)
     | > current_lr: 0.00005 
     | > step_time: 0.49040  (0.49045)
     | > loader_time: 0.28830  (0.28826)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00200)
     | > avg_loss:[92m 0.20463 [0m(-0.05481)
     | > avg_log_mle:[92m -0.38410 [0m(-0.00630)
     | > avg_loss_dur:[92m 0.58873 [0m(-0.04851)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_3618.pth

[4m[1m > EPOCH: 201/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:25:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 3625[0m
     | > loss: 0.12064  (0.09989)
     | > log_mle: -0.36763  (-0.36572)
     | > loss_dur: 0.48827  (0.46562)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.14454  (6.25099)
     | > current_lr: 0.00005 
     | > step_time: 0.64460  (0.66461)
     | > loader_time: 0.40940  (0.42739)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00601)
     | > avg_loss:[91m 0.23250 [0m(+0.02787)
     | > avg_log_mle:[92m -0.38598 [0m(-0.00187)
     | > avg_loss_dur:[91m 0.61848 [0m(+0.02975)


[4m[1m > EPOCH: 202/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:26:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 3650[0m
     | > loss: 0.19495  (0.12011)
     | > log_mle: -0.35324  (-0.36577)
     | > loss_dur: 0.54819  (0.48588)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.15904  (4.54229)
     | > current_lr: 0.00005 
     | > step_time: 1.00590  (0.73510)
     | > loader_time: 0.59150  (0.45591)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00400)
     | > avg_loss:[91m 0.26196 [0m(+0.02946)
     | > avg_log_mle:[91m -0.38501 [0m(+0.00097)
     | > avg_loss_dur:[91m 0.64697 [0m(+0.02850)


[4m[1m > EPOCH: 203/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:26:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00601)
     | > avg_loss:[92m 0.23644 [0m(-0.02552)
     | > avg_log_mle:[92m -0.38570 [0m(-0.00069)
     | > avg_loss_dur:[92m 0.62215 [0m(-0.02483)


[4m[1m > EPOCH: 204/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:27:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 3675[0m
     | > loss: 0.08909  (0.07823)
     | > log_mle: -0.37126  (-0.37467)
     | > loss_dur: 0.46034  (0.45289)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 6.68150  (4.11637)
     | > current_lr: 0.00005 
     | > step_time: 0.68660  (0.62757)
     | > loader_time: 0.43440  (0.38201)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00200)
     | > avg_loss:[91m 0.25842 [0m(+0.02198)
     | > avg_log_mle:[92m -0.38772 [0m(-0.00202)
     | > avg_loss_dur:[91m 0.64614 [0m(+0.02399)


[4m[1m > EPOCH: 205/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:27:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 3700[0m
     | > loss: 0.15052  (0.09513)
     | > log_mle: -0.35528  (-0.36933)
     | > loss_dur: 0.50580  (0.46445)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.07861  (6.89534)
     | > current_lr: 0.00005 
     | > step_time: 0.70060  (0.68953)
     | > loader_time: 0.42540  (0.42078)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00701)
     | > avg_loss:[91m 0.26857 [0m(+0.01015)
     | > avg_log_mle:[91m -0.37652 [0m(+0.01120)
     | > avg_loss_dur:[92m 0.64509 [0m(-0.00105)


[4m[1m > EPOCH: 206/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:28:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 3725[0m
     | > loss: 0.17468  (0.11945)
     | > log_mle: -0.36619  (-0.36681)
     | > loss_dur: 0.54087  (0.48626)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 9.06682  (5.42429)
     | > current_lr: 0.00005 
     | > step_time: 0.84980  (0.76614)
     | > loader_time: 0.44340  (0.47973)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[92m 0.24797 [0m(-0.02059)
     | > avg_log_mle:[92m -0.38379 [0m(-0.00726)
     | > avg_loss_dur:[92m 0.63176 [0m(-0.01333)


[4m[1m > EPOCH: 207/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:28:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[91m 0.27063 [0m(+0.02266)
     | > avg_log_mle:[91m -0.37372 [0m(+0.01007)
     | > avg_loss_dur:[91m 0.64435 [0m(+0.01259)


[4m[1m > EPOCH: 208/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:29:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 3750[0m
     | > loss: 0.07720  (0.07204)
     | > log_mle: -0.35759  (-0.37045)
     | > loss_dur: 0.43479  (0.44248)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.58702  (3.69077)
     | > current_lr: 0.00005 
     | > step_time: 0.63360  (0.66344)
     | > loader_time: 0.38940  (0.40337)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00500)
     | > avg_loss:[92m 0.25619 [0m(-0.01444)
     | > avg_log_mle:[92m -0.38452 [0m(-0.01080)
     | > avg_loss_dur:[92m 0.64071 [0m(-0.00364)


[4m[1m > EPOCH: 209/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:29:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 3775[0m
     | > loss: 0.13656  (0.08954)
     | > log_mle: -0.36565  (-0.37149)
     | > loss_dur: 0.50221  (0.46103)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 7.35698  (5.99268)
     | > current_lr: 0.00005 
     | > step_time: 0.78170  (0.71604)
     | > loader_time: 0.45640  (0.45564)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00601)
     | > avg_loss:[91m 0.27355 [0m(+0.01736)
     | > avg_log_mle:[92m -0.38543 [0m(-0.00091)
     | > avg_loss_dur:[91m 0.65898 [0m(+0.01827)


[4m[1m > EPOCH: 210/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:30:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[92m 0.26915 [0m(-0.00440)
     | > avg_log_mle:[92m -0.38730 [0m(-0.00187)
     | > avg_loss_dur:[92m 0.65645 [0m(-0.00253)


[4m[1m > EPOCH: 211/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:30:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 3800[0m
     | > loss: 0.04828  (0.04165)
     | > log_mle: -0.38658  (-0.38287)
     | > loss_dur: 0.43486  (0.42452)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 5.47719  (4.19000)
     | > current_lr: 0.00005 
     | > step_time: 0.56550  (0.60755)
     | > loader_time: 0.35930  (0.37784)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[92m 0.25686 [0m(-0.01229)
     | > avg_log_mle:[92m -0.38730 [0m(-0.00000)
     | > avg_loss_dur:[92m 0.64416 [0m(-0.01229)


[4m[1m > EPOCH: 212/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:31:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 3825[0m
     | > loss: 0.07168  (0.05648)
     | > log_mle: -0.38351  (-0.37892)
     | > loss_dur: 0.45519  (0.43540)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.28329  (4.68084)
     | > current_lr: 0.00005 
     | > step_time: 0.86580  (0.68796)
     | > loader_time: 0.57350  (0.42138)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00500)
     | > avg_loss:[92m 0.24492 [0m(-0.01194)
     | > avg_log_mle:[92m -0.39003 [0m(-0.00273)
     | > avg_loss_dur:[92m 0.63495 [0m(-0.00921)


[4m[1m > EPOCH: 213/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:31:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 3850[0m
     | > loss: 0.18765  (0.08985)
     | > log_mle: -0.36180  (-0.37560)
     | > loss_dur: 0.54945  (0.46545)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.79656  (4.74863)
     | > current_lr: 0.00005 
     | > step_time: 0.95190  (0.76000)
     | > loader_time: 0.59550  (0.48119)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00400)
     | > avg_loss:[91m 0.25852 [0m(+0.01361)
     | > avg_log_mle:[92m -0.39036 [0m(-0.00033)
     | > avg_loss_dur:[91m 0.64889 [0m(+0.01394)


[4m[1m > EPOCH: 214/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:32:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00400)
     | > avg_loss:[92m 0.23840 [0m(-0.02012)
     | > avg_log_mle:[92m -0.39303 [0m(-0.00267)
     | > avg_loss_dur:[92m 0.63144 [0m(-0.01745)


[4m[1m > EPOCH: 215/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:32:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 3875[0m
     | > loss: 0.04114  (0.03195)
     | > log_mle: -0.37515  (-0.38206)
     | > loss_dur: 0.41629  (0.41401)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 3.40278  (3.83459)
     | > current_lr: 0.00005 
     | > step_time: 0.73770  (0.67181)
     | > loader_time: 0.44340  (0.41398)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00400)
     | > avg_loss:[91m 0.25420 [0m(+0.01580)
     | > avg_log_mle:[92m -0.39371 [0m(-0.00067)
     | > avg_loss_dur:[91m 0.64791 [0m(+0.01647)


[4m[1m > EPOCH: 216/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:33:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 3900[0m
     | > loss: 0.10163  (0.05925)
     | > log_mle: -0.38003  (-0.38080)
     | > loss_dur: 0.48166  (0.44005)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 12.37176  (5.39827)
     | > current_lr: 0.00005 
     | > step_time: 0.91880  (0.71206)
     | > loader_time: 0.63060  (0.44107)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00400)
     | > avg_loss:[92m 0.23966 [0m(-0.01454)
     | > avg_log_mle:[92m -0.39458 [0m(-0.00087)
     | > avg_loss_dur:[92m 0.63424 [0m(-0.01367)


[4m[1m > EPOCH: 217/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:33:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00701)
     | > avg_loss:[91m 0.28405 [0m(+0.04440)
     | > avg_log_mle:[91m -0.38671 [0m(+0.00786)
     | > avg_loss_dur:[91m 0.67077 [0m(+0.03653)


[4m[1m > EPOCH: 218/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:34:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 3925[0m
     | > loss: 0.00731  (0.00731)
     | > log_mle: -0.38468  (-0.38468)
     | > loss_dur: 0.39199  (0.39199)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 8.11629  (8.11629)
     | > current_lr: 0.00005 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.36130  (0.36133)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00400)
     | > avg_loss:[92m 0.26243 [0m(-0.02162)
     | > avg_log_mle:[92m -0.38898 [0m(-0.00226)
     | > avg_loss_dur:[92m 0.65141 [0m(-0.01936)


[4m[1m > EPOCH: 219/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:34:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 3950[0m
     | > loss: 0.06525  (0.03507)
     | > log_mle: -0.38242  (-0.38208)
     | > loss_dur: 0.44767  (0.41715)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 16.73685  (8.29014)
     | > current_lr: 0.00005 
     | > step_time: 0.68160  (0.66636)
     | > loader_time: 0.40540  (0.41162)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[91m 0.26943 [0m(+0.00700)
     | > avg_log_mle:[92m -0.39222 [0m(-0.00324)
     | > avg_loss_dur:[91m 0.66165 [0m(+0.01024)


[4m[1m > EPOCH: 220/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:35:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 3975[0m
     | > loss: 0.12520  (0.06067)
     | > log_mle: -0.37096  (-0.37875)
     | > loss_dur: 0.49616  (0.43942)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 6.86344  (5.82887)
     | > current_lr: 0.00006 
     | > step_time: 0.88600  (0.74770)
     | > loader_time: 0.55810  (0.47687)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00000)
     | > avg_loss:[92m 0.25414 [0m(-0.01529)
     | > avg_log_mle:[91m -0.38019 [0m(+0.01202)
     | > avg_loss_dur:[92m 0.63434 [0m(-0.02731)


[4m[1m > EPOCH: 221/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:36:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00000)
     | > avg_loss:[91m 0.25521 [0m(+0.00107)
     | > avg_log_mle:[92m -0.39653 [0m(-0.01633)
     | > avg_loss_dur:[91m 0.65173 [0m(+0.01740)


[4m[1m > EPOCH: 222/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:36:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 4000[0m
     | > loss: 0.01602  (0.00443)
     | > log_mle: -0.38524  (-0.38623)
     | > loss_dur: 0.40126  (0.39066)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 8.12167  (11.90227)
     | > current_lr: 0.00006 
     | > step_time: 0.73070  (0.65685)
     | > loader_time: 0.50550  (0.41388)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[91m 0.25528 [0m(+0.00007)
     | > avg_log_mle:[91m -0.39257 [0m(+0.00396)
     | > avg_loss_dur:[92m 0.64785 [0m(-0.00388)


[4m[1m > EPOCH: 223/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:37:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 4025[0m
     | > loss: 0.04041  (0.03091)
     | > log_mle: -0.38601  (-0.38454)
     | > loss_dur: 0.42642  (0.41545)
     | > amp_scaler: 65536.00000  (65536.00000)
     | > grad_norm: 8.84625  (5.28854)
     | > current_lr: 0.00006 
     | > step_time: 0.73970  (0.69291)
     | > loader_time: 0.46940  (0.42593)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00701)
     | > avg_loss:[92m 0.23081 [0m(-0.02447)
     | > avg_log_mle:[92m -0.39707 [0m(-0.00450)
     | > avg_loss_dur:[92m 0.62788 [0m(-0.01997)


[4m[1m > EPOCH: 224/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:37:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[91m 0.24684 [0m(+0.01603)
     | > avg_log_mle:[91m -0.39341 [0m(+0.00366)
     | > avg_loss_dur:[91m 0.64025 [0m(+0.01237)


[4m[1m > EPOCH: 225/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:38:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 4050[0m
     | > loss: -0.07479  (-0.07479)
     | > log_mle: -0.40348  (-0.40348)
     | > loss_dur: 0.32869  (0.32869)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 4.15561  (4.15561)
     | > current_lr: 0.00006 
     | > step_time: 0.64160  (0.64158)
     | > loader_time: 0.27420  (0.27424)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00400)
     | > avg_loss:[92m 0.23519 [0m(-0.01165)
     | > avg_log_mle:[92m -0.39913 [0m(-0.00571)
     | > avg_loss_dur:[92m 0.63431 [0m(-0.00594)


[4m[1m > EPOCH: 226/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:38:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 4075[0m
     | > loss: 0.03169  (0.00120)
     | > log_mle: -0.39060  (-0.38695)
     | > loss_dur: 0.42229  (0.38814)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 6.34247  (5.16186)
     | > current_lr: 0.00006 
     | > step_time: 0.64960  (0.66303)
     | > loader_time: 0.39640  (0.42367)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00400)
     | > avg_loss:[91m 0.24664 [0m(+0.01146)
     | > avg_log_mle:[91m -0.39443 [0m(+0.00469)
     | > avg_loss_dur:[91m 0.64108 [0m(+0.00676)


[4m[1m > EPOCH: 227/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:39:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 4100[0m
     | > loss: 0.11893  (0.03373)
     | > log_mle: -0.37110  (-0.38490)
     | > loss_dur: 0.49003  (0.41863)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 11.92320  (8.34517)
     | > current_lr: 0.00006 
     | > step_time: 1.01390  (0.73810)
     | > loader_time: 0.58250  (0.46750)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.01401)
     | > avg_loss:[91m 0.28349 [0m(+0.03684)
     | > avg_log_mle:[91m -0.37830 [0m(+0.01613)
     | > avg_loss_dur:[91m 0.66179 [0m(+0.02071)


[4m[1m > EPOCH: 228/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:39:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00400)
     | > avg_loss:[92m 0.23665 [0m(-0.04684)
     | > avg_log_mle:[92m -0.39796 [0m(-0.01966)
     | > avg_loss_dur:[92m 0.63461 [0m(-0.02719)


[4m[1m > EPOCH: 229/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:40:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 4125[0m
     | > loss: -0.02528  (-0.03153)
     | > log_mle: -0.39116  (-0.39442)
     | > loss_dur: 0.36588  (0.36289)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.70221  (4.56911)
     | > current_lr: 0.00006 
     | > step_time: 0.68260  (0.62790)
     | > loader_time: 0.60250  (0.44907)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00501)
     | > avg_loss:[92m 0.22518 [0m(-0.01147)
     | > avg_log_mle:[91m -0.39686 [0m(+0.00110)
     | > avg_loss_dur:[92m 0.62203 [0m(-0.01257)


[4m[1m > EPOCH: 230/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:40:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 4150[0m
     | > loss: 0.04214  (0.00349)
     | > log_mle: -0.37404  (-0.39054)
     | > loss_dur: 0.41617  (0.39403)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 6.04314  (4.70901)
     | > current_lr: 0.00006 
     | > step_time: 0.70360  (0.68803)
     | > loader_time: 0.48040  (0.44310)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00500)
     | > avg_loss:[91m 0.25035 [0m(+0.02517)
     | > avg_log_mle:[92m -0.39927 [0m(-0.00241)
     | > avg_loss_dur:[91m 0.64961 [0m(+0.02758)


[4m[1m > EPOCH: 231/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:41:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 4175[0m
     | > loss: 0.11086  (0.04126)
     | > log_mle: -0.38339  (-0.38644)
     | > loss_dur: 0.49425  (0.42770)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 10.38157  (8.47909)
     | > current_lr: 0.00006 
     | > step_time: 0.85080  (0.76717)
     | > loader_time: 0.42540  (0.48073)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00300)
     | > avg_loss:[92m 0.24412 [0m(-0.00622)
     | > avg_log_mle:[91m -0.39873 [0m(+0.00054)
     | > avg_loss_dur:[92m 0.64286 [0m(-0.00676)


[4m[1m > EPOCH: 232/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:41:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01201)
     | > avg_loss:[92m 0.24101 [0m(-0.00312)
     | > avg_log_mle:[92m -0.40098 [0m(-0.00225)
     | > avg_loss_dur:[92m 0.64199 [0m(-0.00086)


[4m[1m > EPOCH: 233/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:42:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 4200[0m
     | > loss: 0.00618  (-0.02274)
     | > log_mle: -0.37821  (-0.39174)
     | > loss_dur: 0.38439  (0.36900)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 8.47590  (8.01152)
     | > current_lr: 0.00006 
     | > step_time: 0.63960  (0.67061)
     | > loader_time: 0.44140  (0.42021)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01101)
     | > avg_loss:[92m 0.23640 [0m(-0.00461)
     | > avg_log_mle:[91m -0.39710 [0m(+0.00388)
     | > avg_loss_dur:[92m 0.63350 [0m(-0.00849)


[4m[1m > EPOCH: 234/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:42:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 4225[0m
     | > loss: 0.07159  (0.00432)
     | > log_mle: -0.38574  (-0.39258)
     | > loss_dur: 0.45733  (0.39690)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.85750  (5.60555)
     | > current_lr: 0.00006 
     | > step_time: 0.77370  (0.71689)
     | > loader_time: 0.47640  (0.45195)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00601)
     | > avg_loss:[91m 0.27048 [0m(+0.03408)
     | > avg_log_mle:[91m -0.39590 [0m(+0.00121)
     | > avg_loss_dur:[91m 0.66638 [0m(+0.03287)


[4m[1m > EPOCH: 235/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:43:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00100)
     | > avg_loss:[92m 0.25036 [0m(-0.02012)
     | > avg_log_mle:[92m -0.39918 [0m(-0.00328)
     | > avg_loss_dur:[92m 0.64954 [0m(-0.01684)


[4m[1m > EPOCH: 236/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:43:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 4250[0m
     | > loss: -0.06144  (-0.06832)
     | > log_mle: -0.40330  (-0.40085)
     | > loss_dur: 0.34186  (0.33253)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 11.56659  (7.19938)
     | > current_lr: 0.00006 
     | > step_time: 0.55950  (0.60005)
     | > loader_time: 0.32730  (0.35832)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00701)
     | > avg_loss:[92m 0.21659 [0m(-0.03377)
     | > avg_log_mle:[92m -0.39955 [0m(-0.00038)
     | > avg_loss_dur:[92m 0.61615 [0m(-0.03339)


[4m[1m > EPOCH: 237/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:44:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 4275[0m
     | > loss: 0.01546  (-0.02371)
     | > log_mle: -0.39937  (-0.39731)
     | > loss_dur: 0.41482  (0.37360)
     | > amp_scaler: 32768.00000  (32768.00000)
     | > grad_norm: 2.42481  (3.91058)
     | > current_lr: 0.00006 
     | > step_time: 0.86880  (0.68685)
     | > loader_time: 0.59350  (0.42728)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[91m 0.23189 [0m(+0.01529)
     | > avg_log_mle:[91m -0.39699 [0m(+0.00256)
     | > avg_loss_dur:[91m 0.62888 [0m(+0.01273)


[4m[1m > EPOCH: 238/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:44:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 4300[0m
     | > loss: 0.16240  (0.01252)
     | > log_mle: -0.36876  (-0.39113)
     | > loss_dur: 0.53116  (0.40365)
     | > amp_scaler: 16384.00000  (28672.00000)
     | > grad_norm: 4.57817  (8.01618)
     | > current_lr: 0.00006 
     | > step_time: 0.94590  (0.75988)
     | > loader_time: 0.57650  (0.47543)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.01101)
     | > avg_loss:[91m 0.25685 [0m(+0.02496)
     | > avg_log_mle:[91m -0.39680 [0m(+0.00019)
     | > avg_loss_dur:[91m 0.65365 [0m(+0.02477)


[4m[1m > EPOCH: 239/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:45:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00601)
     | > avg_loss:[92m 0.24997 [0m(-0.00688)
     | > avg_log_mle:[92m -0.39866 [0m(-0.00186)
     | > avg_loss_dur:[92m 0.64863 [0m(-0.00501)


[4m[1m > EPOCH: 240/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:45:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 4325[0m
     | > loss: -0.04020  (-0.04845)
     | > log_mle: -0.39318  (-0.39698)
     | > loss_dur: 0.35299  (0.34853)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.16134  (4.06375)
     | > current_lr: 0.00006 
     | > step_time: 0.73770  (0.67041)
     | > loader_time: 0.41140  (0.40517)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[92m 0.21780 [0m(-0.03217)
     | > avg_log_mle:[92m -0.40263 [0m(-0.00397)
     | > avg_loss_dur:[92m 0.62043 [0m(-0.02820)


[4m[1m > EPOCH: 241/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:46:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 4350[0m
     | > loss: 0.02970  (-0.01354)
     | > log_mle: -0.39120  (-0.39519)
     | > loss_dur: 0.42090  (0.38165)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.52126  (6.62903)
     | > current_lr: 0.00006 
     | > step_time: 0.90980  (0.71416)
     | > loader_time: 0.65360  (0.44264)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00801)
     | > avg_loss:[91m 0.25328 [0m(+0.03548)
     | > avg_log_mle:[91m -0.39984 [0m(+0.00279)
     | > avg_loss_dur:[91m 0.65312 [0m(+0.03269)


[4m[1m > EPOCH: 242/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:46:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07806 [0m(+0.00399)
     | > avg_loss:[92m 0.24304 [0m(-0.01024)
     | > avg_log_mle:[91m -0.39965 [0m(+0.00018)
     | > avg_loss_dur:[92m 0.64270 [0m(-0.01042)


[4m[1m > EPOCH: 243/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:47:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 4375[0m
     | > loss: -0.09758  (-0.09758)
     | > log_mle: -0.40476  (-0.40476)
     | > loss_dur: 0.30718  (0.30718)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.29171  (5.29171)
     | > current_lr: 0.00006 
     | > step_time: 0.66460  (0.66461)
     | > loader_time: 0.37830  (0.37834)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06304 [0m(-0.01501)
     | > avg_loss:[92m 0.24033 [0m(-0.00271)
     | > avg_log_mle:[92m -0.40664 [0m(-0.00699)
     | > avg_loss_dur:[91m 0.64697 [0m(+0.00428)


[4m[1m > EPOCH: 244/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:48:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 4400[0m
     | > loss: -0.02325  (-0.05314)
     | > log_mle: -0.40648  (-0.40161)
     | > loss_dur: 0.38323  (0.34847)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.25884  (5.90391)
     | > current_lr: 0.00006 
     | > step_time: 0.67960  (0.66498)
     | > loader_time: 0.45340  (0.42589)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00902)
     | > avg_loss:[91m 0.24975 [0m(+0.00942)
     | > avg_log_mle:[91m -0.40439 [0m(+0.00226)
     | > avg_loss_dur:[91m 0.65414 [0m(+0.00717)


[4m[1m > EPOCH: 245/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:48:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 4425[0m
     | > loss: 0.06126  (-0.00666)
     | > log_mle: -0.38992  (-0.39640)
     | > loss_dur: 0.45118  (0.38974)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.51600  (7.31625)
     | > current_lr: 0.00006 
     | > step_time: 0.87380  (0.74708)
     | > loader_time: 0.53750  (0.47703)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00000)
     | > avg_loss:[91m 0.25915 [0m(+0.00940)
     | > avg_log_mle:[92m -0.40708 [0m(-0.00269)
     | > avg_loss_dur:[91m 0.66623 [0m(+0.01209)


[4m[1m > EPOCH: 246/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:49:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07207 [0m(+0.00000)
     | > avg_loss:[92m 0.24445 [0m(-0.01470)
     | > avg_log_mle:[92m -0.40823 [0m(-0.00115)
     | > avg_loss_dur:[92m 0.65267 [0m(-0.01355)


[4m[1m > EPOCH: 247/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:49:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 4450[0m
     | > loss: -0.06995  (-0.08624)
     | > log_mle: -0.40340  (-0.40720)
     | > loss_dur: 0.33345  (0.32096)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 23.34729  (10.05636)
     | > current_lr: 0.00006 
     | > step_time: 0.72570  (0.65336)
     | > loader_time: 0.45740  (0.43489)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[92m 0.23862 [0m(-0.00583)
     | > avg_log_mle:[91m -0.40501 [0m(+0.00322)
     | > avg_loss_dur:[92m 0.64362 [0m(-0.00905)


[4m[1m > EPOCH: 248/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:50:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 4475[0m
     | > loss: -0.01161  (-0.04240)
     | > log_mle: -0.40168  (-0.40194)
     | > loss_dur: 0.39007  (0.35953)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.47679  (5.62714)
     | > current_lr: 0.00006 
     | > step_time: 0.74170  (0.69463)
     | > loader_time: 0.47940  (0.43476)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00801)
     | > avg_loss:[91m 0.26097 [0m(+0.02235)
     | > avg_log_mle:[91m -0.40117 [0m(+0.00383)
     | > avg_loss_dur:[91m 0.66214 [0m(+0.01852)


[4m[1m > EPOCH: 249/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:50:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.00300)
     | > avg_loss:[91m 0.29292 [0m(+0.03195)
     | > avg_log_mle:[92m -0.40401 [0m(-0.00283)
     | > avg_loss_dur:[91m 0.69693 [0m(+0.03479)


[4m[1m > EPOCH: 250/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:51:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 4500[0m
     | > loss: -0.16315  (-0.16315)
     | > log_mle: -0.41517  (-0.41517)
     | > loss_dur: 0.25202  (0.25202)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.66337  (7.66337)
     | > current_lr: 0.00006 
     | > step_time: 0.50150  (0.50146)
     | > loader_time: 0.27120  (0.27125)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00300)
     | > avg_loss:[92m 0.25472 [0m(-0.03820)
     | > avg_log_mle:[91m -0.40230 [0m(+0.00170)
     | > avg_loss_dur:[92m 0.65703 [0m(-0.03990)


[4m[1m > EPOCH: 251/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:51:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 4525[0m
     | > loss: -0.02909  (-0.06767)
     | > log_mle: -0.40510  (-0.40385)
     | > loss_dur: 0.37601  (0.33618)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.10428  (5.52398)
     | > current_lr: 0.00006 
     | > step_time: 0.65260  (0.66089)
     | > loader_time: 0.43440  (0.41338)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.01001)
     | > avg_loss:[92m 0.23385 [0m(-0.02087)
     | > avg_log_mle:[91m -0.40184 [0m(+0.00046)
     | > avg_loss_dur:[92m 0.63569 [0m(-0.02134)


[4m[1m > EPOCH: 252/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:52:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 4550[0m
     | > loss: 0.06551  (-0.03332)
     | > log_mle: -0.38653  (-0.40193)
     | > loss_dur: 0.45204  (0.36861)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.74050  (8.38844)
     | > current_lr: 0.00006 
     | > step_time: 1.00690  (0.73882)
     | > loader_time: 0.63060  (0.46871)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08107 [0m(+0.01301)
     | > avg_loss:[91m 0.26699 [0m(+0.03313)
     | > avg_log_mle:[92m -0.41246 [0m(-0.01062)
     | > avg_loss_dur:[91m 0.67945 [0m(+0.04375)


[4m[1m > EPOCH: 253/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:52:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.01101)
     | > avg_loss:[92m 0.24316 [0m(-0.02383)
     | > avg_log_mle:[91m -0.40558 [0m(+0.00688)
     | > avg_loss_dur:[92m 0.64874 [0m(-0.03070)


[4m[1m > EPOCH: 254/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:53:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 4575[0m
     | > loss: -0.08263  (-0.10792)
     | > log_mle: -0.40935  (-0.41294)
     | > loss_dur: 0.32672  (0.30503)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.35126  (8.55722)
     | > current_lr: 0.00006 
     | > step_time: 0.68760  (0.63324)
     | > loader_time: 0.42540  (0.38101)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00000)
     | > avg_loss:[92m 0.22991 [0m(-0.01324)
     | > avg_log_mle:[91m -0.40196 [0m(+0.00363)
     | > avg_loss_dur:[92m 0.63187 [0m(-0.01687)


[4m[1m > EPOCH: 255/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:53:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 4600[0m
     | > loss: 0.00203  (-0.04728)
     | > log_mle: -0.38685  (-0.40189)
     | > loss_dur: 0.38888  (0.35461)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.79636  (8.82058)
     | > current_lr: 0.00006 
     | > step_time: 0.69960  (0.69173)
     | > loader_time: 0.47840  (0.43680)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.23027 [0m(+0.00036)
     | > avg_log_mle:[92m -0.40559 [0m(-0.00363)
     | > avg_loss_dur:[91m 0.63586 [0m(+0.00399)


[4m[1m > EPOCH: 256/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:54:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 4625[0m
     | > loss: 0.07798  (-0.01725)
     | > log_mle: -0.39498  (-0.40093)
     | > loss_dur: 0.47296  (0.38368)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.76152  (7.49408)
     | > current_lr: 0.00006 
     | > step_time: 0.84480  (0.76376)
     | > loader_time: 0.39840  (0.46766)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[92m 0.20391 [0m(-0.02636)
     | > avg_log_mle:[92m -0.41480 [0m(-0.00920)
     | > avg_loss_dur:[92m 0.61871 [0m(-0.01715)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_4626.pth

[4m[1m > EPOCH: 257/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:54:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[91m 0.22789 [0m(+0.02398)
     | > avg_log_mle:[91m -0.40402 [0m(+0.01078)
     | > avg_loss_dur:[91m 0.63191 [0m(+0.01320)


[4m[1m > EPOCH: 258/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:55:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 4650[0m
     | > loss: -0.06755  (-0.09043)
     | > log_mle: -0.39793  (-0.41126)
     | > loss_dur: 0.33038  (0.32084)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.14840  (7.78769)
     | > current_lr: 0.00006 
     | > step_time: 0.63460  (0.66694)
     | > loader_time: 0.37530  (0.42155)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[92m 0.20255 [0m(-0.02534)
     | > avg_log_mle:[92m -0.41015 [0m(-0.00613)
     | > avg_loss_dur:[92m 0.61270 [0m(-0.01921)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_4662.pth

[4m[1m > EPOCH: 259/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:56:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 4675[0m
     | > loss: 0.01722  (-0.05498)
     | > log_mle: -0.40348  (-0.41038)
     | > loss_dur: 0.42070  (0.35540)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.41298  (6.16577)
     | > current_lr: 0.00006 
     | > step_time: 0.78370  (0.71927)
     | > loader_time: 0.52450  (0.46203)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[91m 0.21581 [0m(+0.01326)
     | > avg_log_mle:[91m -0.40475 [0m(+0.00539)
     | > avg_loss_dur:[91m 0.62056 [0m(+0.00786)


[4m[1m > EPOCH: 260/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:56:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00000)
     | > avg_loss:[91m 0.22043 [0m(+0.00462)
     | > avg_log_mle:[92m -0.40884 [0m(-0.00409)
     | > avg_loss_dur:[91m 0.62927 [0m(+0.00871)


[4m[1m > EPOCH: 261/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:57:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 4700[0m
     | > loss: -0.09541  (-0.11811)
     | > log_mle: -0.41594  (-0.41560)
     | > loss_dur: 0.32053  (0.29748)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 25.76951  (31.35706)
     | > current_lr: 0.00007 
     | > step_time: 0.56050  (0.60855)
     | > loader_time: 0.33730  (0.36383)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00400)
     | > avg_loss:[91m 0.25886 [0m(+0.03843)
     | > avg_log_mle:[92m -0.40887 [0m(-0.00004)
     | > avg_loss_dur:[91m 0.66773 [0m(+0.03847)


[4m[1m > EPOCH: 262/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:57:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 4725[0m
     | > loss: -0.00515  (-0.05642)
     | > log_mle: -0.41503  (-0.41197)
     | > loss_dur: 0.40988  (0.35555)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.17395  (9.05125)
     | > current_lr: 0.00007 
     | > step_time: 0.87280  (0.68741)
     | > loader_time: 0.52450  (0.41838)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00901)
     | > avg_loss:[91m 0.27771 [0m(+0.01885)
     | > avg_log_mle:[92m -0.41058 [0m(-0.00170)
     | > avg_loss_dur:[91m 0.68829 [0m(+0.02055)


[4m[1m > EPOCH: 263/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:58:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 4750[0m
     | > loss: 0.09290  (-0.01567)
     | > log_mle: -0.38785  (-0.40272)
     | > loss_dur: 0.48075  (0.38705)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.94164  (12.87475)
     | > current_lr: 0.00007 
     | > step_time: 0.95290  (0.76251)
     | > loader_time: 0.60150  (0.48507)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00200)
     | > avg_loss:[92m 0.22790 [0m(-0.04981)
     | > avg_log_mle:[92m -0.41458 [0m(-0.00400)
     | > avg_loss_dur:[92m 0.64248 [0m(-0.04581)


[4m[1m > EPOCH: 264/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:58:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.01001)
     | > avg_loss:[92m 0.19599 [0m(-0.03191)
     | > avg_log_mle:[92m -0.41536 [0m(-0.00078)
     | > avg_loss_dur:[92m 0.61134 [0m(-0.03114)

 > BEST MODEL : ./output\run-September-15-2022_04+45AM-910d77a\best_model_4770.pth

[4m[1m > EPOCH: 265/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:59:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 4775[0m
     | > loss: -0.05702  (-0.11018)
     | > log_mle: -0.41016  (-0.41857)
     | > loss_dur: 0.35314  (0.30839)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.54775  (7.46219)
     | > current_lr: 0.00007 
     | > step_time: 0.74070  (0.67241)
     | > loader_time: 0.45840  (0.40657)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00500)
     | > avg_loss:[91m 0.21268 [0m(+0.01669)
     | > avg_log_mle:[91m -0.41475 [0m(+0.00061)
     | > avg_loss_dur:[91m 0.62743 [0m(+0.01608)


[4m[1m > EPOCH: 266/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 06:59:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 4800[0m
     | > loss: -0.01791  (-0.07998)
     | > log_mle: -0.41305  (-0.41499)
     | > loss_dur: 0.39514  (0.33500)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.12393  (7.95970)
     | > current_lr: 0.00007 
     | > step_time: 0.91180  (0.71657)
     | > loader_time: 0.62860  (0.45691)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[92m 0.21117 [0m(-0.00151)
     | > avg_log_mle:[91m -0.41464 [0m(+0.00011)
     | > avg_loss_dur:[92m 0.62581 [0m(-0.00161)


[4m[1m > EPOCH: 267/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:00:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[91m 0.24196 [0m(+0.03079)
     | > avg_log_mle:[92m -0.41640 [0m(-0.00176)
     | > avg_loss_dur:[91m 0.65836 [0m(+0.03254)


[4m[1m > EPOCH: 268/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:00:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 4825[0m
     | > loss: -0.16673  (-0.16673)
     | > log_mle: -0.42201  (-0.42201)
     | > loss_dur: 0.25529  (0.25529)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.66236  (4.66236)
     | > current_lr: 0.00007 
     | > step_time: 0.64960  (0.64959)
     | > loader_time: 0.37130  (0.37134)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07106 [0m(+0.00000)
     | > avg_loss:[92m 0.22751 [0m(-0.01445)
     | > avg_log_mle:[91m -0.41227 [0m(+0.00413)
     | > avg_loss_dur:[92m 0.63978 [0m(-0.01858)


[4m[1m > EPOCH: 269/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:01:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 4850[0m
     | > loss: -0.05821  (-0.10647)
     | > log_mle: -0.41889  (-0.41685)
     | > loss_dur: 0.36068  (0.31038)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.97883  (6.55490)
     | > current_lr: 0.00007 
     | > step_time: 0.67660  (0.66235)
     | > loader_time: 0.38330  (0.40462)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00701)
     | > avg_loss:[91m 0.26097 [0m(+0.03346)
     | > avg_log_mle:[92m -0.41271 [0m(-0.00044)
     | > avg_loss_dur:[91m 0.67367 [0m(+0.03389)


[4m[1m > EPOCH: 270/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:01:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 4875[0m
     | > loss: 0.00565  (-0.06543)
     | > log_mle: -0.40384  (-0.40932)
     | > loss_dur: 0.40949  (0.34390)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 2.98600  (8.21501)
     | > current_lr: 0.00007 
     | > step_time: 0.87480  (0.74962)
     | > loader_time: 0.57850  (0.46776)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00500)
     | > avg_loss:[92m 0.23671 [0m(-0.02425)
     | > avg_log_mle:[92m -0.41685 [0m(-0.00414)
     | > avg_loss_dur:[92m 0.65356 [0m(-0.02011)


[4m[1m > EPOCH: 271/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:02:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00400)
     | > avg_loss:[92m 0.23380 [0m(-0.00291)
     | > avg_log_mle:[92m -0.41890 [0m(-0.00205)
     | > avg_loss_dur:[92m 0.65270 [0m(-0.00087)


[4m[1m > EPOCH: 272/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:02:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 4900[0m
     | > loss: -0.12059  (-0.14614)
     | > log_mle: -0.41911  (-0.42482)
     | > loss_dur: 0.29852  (0.27868)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.74778  (8.47989)
     | > current_lr: 0.00007 
     | > step_time: 0.73070  (0.65660)
     | > loader_time: 0.48140  (0.41587)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07005 [0m(+0.00499)
     | > avg_loss:[92m 0.21861 [0m(-0.01519)
     | > avg_log_mle:[91m -0.41735 [0m(+0.00155)
     | > avg_loss_dur:[92m 0.63596 [0m(-0.01674)


[4m[1m > EPOCH: 273/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:03:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 4925[0m
     | > loss: -0.07924  (-0.10448)
     | > log_mle: -0.41717  (-0.42018)
     | > loss_dur: 0.33792  (0.31570)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.18096  (9.99845)
     | > current_lr: 0.00007 
     | > step_time: 0.73470  (0.69445)
     | > loader_time: 0.43640  (0.42775)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00299)
     | > avg_loss:[91m 0.22670 [0m(+0.00810)
     | > avg_log_mle:[92m -0.41832 [0m(-0.00097)
     | > avg_loss_dur:[91m 0.64503 [0m(+0.00907)


[4m[1m > EPOCH: 274/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:03:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07506 [0m(+0.00800)
     | > avg_loss:[91m 0.25091 [0m(+0.02421)
     | > avg_log_mle:[92m -0.42016 [0m(-0.00184)
     | > avg_loss_dur:[91m 0.67107 [0m(+0.02605)


[4m[1m > EPOCH: 275/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:04:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 4950[0m
     | > loss: -0.21345  (-0.21345)
     | > log_mle: -0.43949  (-0.43949)
     | > loss_dur: 0.22604  (0.22604)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.06597  (4.06597)
     | > current_lr: 0.00007 
     | > step_time: 0.61160  (0.61156)
     | > loader_time: 0.25520  (0.25522)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06805 [0m(-0.00701)
     | > avg_loss:[92m 0.24928 [0m(-0.00163)
     | > avg_log_mle:[91m -0.40621 [0m(+0.01395)
     | > avg_loss_dur:[92m 0.65549 [0m(-0.01558)


[4m[1m > EPOCH: 276/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:05:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 4975[0m
     | > loss: -0.06474  (-0.11134)
     | > log_mle: -0.41525  (-0.41573)
     | > loss_dur: 0.35051  (0.30439)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.22609  (7.87138)
     | > current_lr: 0.00007 
     | > step_time: 0.65560  (0.66590)
     | > loader_time: 0.41440  (0.39693)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06905 [0m(+0.00100)
     | > avg_loss:[92m 0.23853 [0m(-0.01075)
     | > avg_log_mle:[92m -0.41464 [0m(-0.00842)
     | > avg_loss_dur:[92m 0.65317 [0m(-0.00233)


[4m[1m > EPOCH: 277/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:05:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 5000[0m
     | > loss: 0.01780  (-0.08602)
     | > log_mle: -0.39813  (-0.41699)
     | > loss_dur: 0.41594  (0.33097)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 9.84264  (10.54553)
     | > current_lr: 0.00007 
     | > step_time: 1.01490  (0.74233)
     | > loader_time: 0.65760  (0.47207)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00399)
     | > avg_loss:[91m 0.24765 [0m(+0.00912)
     | > avg_log_mle:[92m -0.41899 [0m(-0.00436)
     | > avg_loss_dur:[91m 0.66664 [0m(+0.01347)


[4m[1m > EPOCH: 278/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:06:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00300)
     | > avg_loss:[91m 0.25352 [0m(+0.00588)
     | > avg_log_mle:[92m -0.42258 [0m(-0.00359)
     | > avg_loss_dur:[91m 0.67611 [0m(+0.00947)


[4m[1m > EPOCH: 279/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:06:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 5025[0m
     | > loss: -0.14114  (-0.16439)
     | > log_mle: -0.43148  (-0.43356)
     | > loss_dur: 0.29034  (0.26917)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.61355  (8.50537)
     | > current_lr: 0.00007 
     | > step_time: 0.68760  (0.63625)
     | > loader_time: 0.42040  (0.37868)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.00801)
     | > avg_loss:[92m 0.25127 [0m(-0.00225)
     | > avg_log_mle:[92m -0.42389 [0m(-0.00131)
     | > avg_loss_dur:[92m 0.67516 [0m(-0.00095)


[4m[1m > EPOCH: 280/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:07:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 5050[0m
     | > loss: -0.06096  (-0.11255)
     | > log_mle: -0.40513  (-0.42514)
     | > loss_dur: 0.34417  (0.31259)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.56412  (6.82881)
     | > current_lr: 0.00007 
     | > step_time: 0.69660  (0.69013)
     | > loader_time: 0.42040  (0.44891)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.01101)
     | > avg_loss:[92m 0.21568 [0m(-0.03560)
     | > avg_log_mle:[91m -0.41670 [0m(+0.00719)
     | > avg_loss_dur:[92m 0.63237 [0m(-0.04279)


[4m[1m > EPOCH: 281/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:07:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 5075[0m
     | > loss: -0.00178  (-0.07055)
     | > log_mle: -0.41190  (-0.41816)
     | > loss_dur: 0.41013  (0.34761)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.93922  (8.16409)
     | > current_lr: 0.00007 
     | > step_time: 0.85380  (0.77011)
     | > loader_time: 0.41940  (0.48538)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[91m 0.29228 [0m(+0.07660)
     | > avg_log_mle:[91m -0.39890 [0m(+0.01780)
     | > avg_loss_dur:[91m 0.69117 [0m(+0.05880)


[4m[1m > EPOCH: 282/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:08:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00500)
     | > avg_loss:[92m 0.22411 [0m(-0.06817)
     | > avg_log_mle:[92m -0.42129 [0m(-0.02240)
     | > avg_loss_dur:[92m 0.64540 [0m(-0.04577)


[4m[1m > EPOCH: 283/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:08:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 5100[0m
     | > loss: -0.09550  (-0.13455)
     | > log_mle: -0.40561  (-0.42043)
     | > loss_dur: 0.31011  (0.28587)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.12764  (15.71992)
     | > current_lr: 0.00007 
     | > step_time: 0.64460  (0.66978)
     | > loader_time: 0.39840  (0.41588)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[91m 0.27122 [0m(+0.04711)
     | > avg_log_mle:[91m -0.40839 [0m(+0.01291)
     | > avg_loss_dur:[91m 0.67961 [0m(+0.03421)


[4m[1m > EPOCH: 284/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:09:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 5125[0m
     | > loss: -0.01506  (-0.10120)
     | > log_mle: -0.41334  (-0.42265)
     | > loss_dur: 0.39828  (0.32144)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.19184  (10.84670)
     | > current_lr: 0.00007 
     | > step_time: 0.78170  (0.71981)
     | > loader_time: 0.48840  (0.46249)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.00801)
     | > avg_loss:[92m 0.22156 [0m(-0.04967)
     | > avg_log_mle:[92m -0.42168 [0m(-0.01329)
     | > avg_loss_dur:[92m 0.64323 [0m(-0.03638)


[4m[1m > EPOCH: 285/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:09:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00901)
     | > avg_loss:[91m 0.25584 [0m(+0.03428)
     | > avg_log_mle:[92m -0.42246 [0m(-0.00078)
     | > avg_loss_dur:[91m 0.67829 [0m(+0.03506)


[4m[1m > EPOCH: 286/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:10:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 5150[0m
     | > loss: -0.19000  (-0.18597)
     | > log_mle: -0.44161  (-0.43713)
     | > loss_dur: 0.25162  (0.25116)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.91574  (7.87870)
     | > current_lr: 0.00007 
     | > step_time: 0.56350  (0.61406)
     | > loader_time: 0.33130  (0.35782)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00100)
     | > avg_loss:[92m 0.23215 [0m(-0.02368)
     | > avg_log_mle:[92m -0.42421 [0m(-0.00175)
     | > avg_loss_dur:[92m 0.65636 [0m(-0.02193)


[4m[1m > EPOCH: 287/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:10:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 5175[0m
     | > loss: -0.10220  (-0.13395)
     | > log_mle: -0.43389  (-0.43220)
     | > loss_dur: 0.33169  (0.29825)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.73935  (10.05819)
     | > current_lr: 0.00007 
     | > step_time: 0.87180  (0.69096)
     | > loader_time: 0.62860  (0.43973)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00000)
     | > avg_loss:[92m 0.20854 [0m(-0.02361)
     | > avg_log_mle:[92m -0.42802 [0m(-0.00382)
     | > avg_loss_dur:[92m 0.63657 [0m(-0.01980)


[4m[1m > EPOCH: 288/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:11:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 5200[0m
     | > loss: 0.03691  (-0.09404)
     | > log_mle: -0.40291  (-0.42502)
     | > loss_dur: 0.43982  (0.33099)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 9.29196  (9.43597)
     | > current_lr: 0.00007 
     | > step_time: 0.94890  (0.76369)
     | > loader_time: 0.60350  (0.47956)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08107 [0m(+0.01201)
     | > avg_loss:[91m 0.24339 [0m(+0.03485)
     | > avg_log_mle:[92m -0.42846 [0m(-0.00044)
     | > avg_loss_dur:[91m 0.67186 [0m(+0.03529)


[4m[1m > EPOCH: 289/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:11:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.01601)
     | > avg_loss:[92m 0.23553 [0m(-0.00786)
     | > avg_log_mle:[91m -0.42662 [0m(+0.00184)
     | > avg_loss_dur:[92m 0.66215 [0m(-0.00971)


[4m[1m > EPOCH: 290/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:12:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 5225[0m
     | > loss: -0.12405  (-0.17268)
     | > log_mle: -0.42567  (-0.43466)
     | > loss_dur: 0.30161  (0.26198)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.93700  (9.21059)
     | > current_lr: 0.00007 
     | > step_time: 0.73670  (0.67582)
     | > loader_time: 0.41840  (0.40697)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00300)
     | > avg_loss:[91m 0.27201 [0m(+0.03648)
     | > avg_log_mle:[91m -0.41516 [0m(+0.01146)
     | > avg_loss_dur:[91m 0.68717 [0m(+0.02502)


[4m[1m > EPOCH: 291/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:12:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 5250[0m
     | > loss: -0.04067  (-0.12054)
     | > log_mle: -0.41898  (-0.42513)
     | > loss_dur: 0.37831  (0.30460)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.10467  (9.31843)
     | > current_lr: 0.00007 
     | > step_time: 0.92480  (0.71240)
     | > loader_time: 0.62460  (0.44182)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[92m 0.24477 [0m(-0.02725)
     | > avg_log_mle:[92m -0.41689 [0m(-0.00173)
     | > avg_loss_dur:[92m 0.66165 [0m(-0.02552)


[4m[1m > EPOCH: 292/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:13:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[92m 0.20732 [0m(-0.03745)
     | > avg_log_mle:[92m -0.42112 [0m(-0.00423)
     | > avg_loss_dur:[92m 0.62844 [0m(-0.03321)


[4m[1m > EPOCH: 293/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:13:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 5275[0m
     | > loss: -0.20908  (-0.20908)
     | > log_mle: -0.43578  (-0.43578)
     | > loss_dur: 0.22670  (0.22670)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.41772  (4.41772)
     | > current_lr: 0.00007 
     | > step_time: 0.64460  (0.64459)
     | > loader_time: 0.40140  (0.40136)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00400)
     | > avg_loss:[91m 0.26631 [0m(+0.05899)
     | > avg_log_mle:[92m -0.42413 [0m(-0.00301)
     | > avg_loss_dur:[91m 0.69044 [0m(+0.06200)


[4m[1m > EPOCH: 294/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:14:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 5300[0m
     | > loss: -0.11988  (-0.15044)
     | > log_mle: -0.43426  (-0.43308)
     | > loss_dur: 0.31438  (0.28264)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.35671  (7.90039)
     | > current_lr: 0.00007 
     | > step_time: 0.68560  (0.66861)
     | > loader_time: 0.43740  (0.41913)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00200)
     | > avg_loss:[92m 0.25865 [0m(-0.00766)
     | > avg_log_mle:[91m -0.41416 [0m(+0.00997)
     | > avg_loss_dur:[92m 0.67281 [0m(-0.01764)


[4m[1m > EPOCH: 295/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:14:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 5325[0m
     | > loss: -0.04281  (-0.10724)
     | > log_mle: -0.41813  (-0.42581)
     | > loss_dur: 0.37532  (0.31857)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.52906  (6.48642)
     | > current_lr: 0.00007 
     | > step_time: 0.87880  (0.74761)
     | > loader_time: 0.53150  (0.47837)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00100)
     | > avg_loss:[92m 0.25096 [0m(-0.00769)
     | > avg_log_mle:[92m -0.42639 [0m(-0.01223)
     | > avg_loss_dur:[91m 0.67735 [0m(+0.00454)


[4m[1m > EPOCH: 296/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:15:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[91m 0.29511 [0m(+0.04415)
     | > avg_log_mle:[91m -0.41400 [0m(+0.01238)
     | > avg_loss_dur:[91m 0.70912 [0m(+0.03177)


[4m[1m > EPOCH: 297/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:16:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 5350[0m
     | > loss: -0.11241  (-0.17717)
     | > log_mle: -0.41560  (-0.43143)
     | > loss_dur: 0.30319  (0.25426)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 9.32425  (9.10119)
     | > current_lr: 0.00007 
     | > step_time: 0.73070  (0.65560)
     | > loader_time: 0.49850  (0.39186)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[92m 0.26754 [0m(-0.02757)
     | > avg_log_mle:[92m -0.41878 [0m(-0.00478)
     | > avg_loss_dur:[92m 0.68632 [0m(-0.02280)


[4m[1m > EPOCH: 298/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:16:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 5375[0m
     | > loss: -0.09001  (-0.13893)
     | > log_mle: -0.42932  (-0.42897)
     | > loss_dur: 0.33931  (0.29004)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.26015  (12.03500)
     | > current_lr: 0.00007 
     | > step_time: 0.73670  (0.69745)
     | > loader_time: 0.43440  (0.43540)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[92m 0.24565 [0m(-0.02189)
     | > avg_log_mle:[92m -0.42627 [0m(-0.00749)
     | > avg_loss_dur:[92m 0.67192 [0m(-0.01439)


[4m[1m > EPOCH: 299/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:17:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08308 [0m(+0.01702)
     | > avg_loss:[92m 0.23805 [0m(-0.00760)
     | > avg_log_mle:[92m -0.42947 [0m(-0.00320)
     | > avg_loss_dur:[92m 0.66753 [0m(-0.00440)


[4m[1m > EPOCH: 300/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:17:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 5400[0m
     | > loss: -0.24757  (-0.24757)
     | > log_mle: -0.45382  (-0.45382)
     | > loss_dur: 0.20625  (0.20625)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.14204  (10.14204)
     | > current_lr: 0.00007 
     | > step_time: 0.50350  (0.50346)
     | > loader_time: 0.29330  (0.29325)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00901)
     | > avg_loss:[91m 0.25265 [0m(+0.01460)
     | > avg_log_mle:[91m -0.42186 [0m(+0.00762)
     | > avg_loss_dur:[91m 0.67450 [0m(+0.00698)


[4m[1m > EPOCH: 301/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:18:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 5425[0m
     | > loss: -0.12864  (-0.17397)
     | > log_mle: -0.43922  (-0.43962)
     | > loss_dur: 0.31057  (0.26565)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.13403  (11.95430)
     | > current_lr: 0.00008 
     | > step_time: 0.64660  (0.66704)
     | > loader_time: 0.40240  (0.42153)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00901)
     | > avg_loss:[92m 0.25200 [0m(-0.00065)
     | > avg_log_mle:[92m -0.43043 [0m(-0.00858)
     | > avg_loss_dur:[91m 0.68244 [0m(+0.00793)


[4m[1m > EPOCH: 302/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:18:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 5450[0m
     | > loss: -0.02720  (-0.13690)
     | > log_mle: -0.41000  (-0.43545)
     | > loss_dur: 0.38280  (0.29855)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 16.51401  (11.85358)
     | > current_lr: 0.00008 
     | > step_time: 1.01390  (0.74253)
     | > loader_time: 0.61460  (0.47450)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00801)
     | > avg_loss:[91m 0.27380 [0m(+0.02180)
     | > avg_log_mle:[91m -0.42284 [0m(+0.00759)
     | > avg_loss_dur:[91m 0.69664 [0m(+0.01420)


[4m[1m > EPOCH: 303/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:19:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06605 [0m(-0.00702)
     | > avg_loss:[91m 0.28338 [0m(+0.00958)
     | > avg_log_mle:[91m -0.39604 [0m(+0.02680)
     | > avg_loss_dur:[92m 0.67942 [0m(-0.01722)


[4m[1m > EPOCH: 304/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:19:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 5475[0m
     | > loss: -0.17082  (-0.19874)
     | > log_mle: -0.43346  (-0.43556)
     | > loss_dur: 0.26264  (0.23682)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.99555  (7.02689)
     | > current_lr: 0.00008 
     | > step_time: 0.68760  (0.63191)
     | > loader_time: 0.44240  (0.40270)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06805 [0m(+0.00200)
     | > avg_loss:[92m 0.23553 [0m(-0.04785)
     | > avg_log_mle:[92m -0.42647 [0m(-0.03043)
     | > avg_loss_dur:[92m 0.66200 [0m(-0.01742)


[4m[1m > EPOCH: 305/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:20:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 5500[0m
     | > loss: -0.13735  (-0.15491)
     | > log_mle: -0.41969  (-0.43457)
     | > loss_dur: 0.28234  (0.27966)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.09907  (11.53199)
     | > current_lr: 0.00008 
     | > step_time: 0.70760  (0.69644)
     | > loader_time: 0.45940  (0.44570)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00301)
     | > avg_loss:[91m 0.25699 [0m(+0.02146)
     | > avg_log_mle:[91m -0.42437 [0m(+0.00210)
     | > avg_loss_dur:[91m 0.68136 [0m(+0.01936)


[4m[1m > EPOCH: 306/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:20:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 5525[0m
     | > loss: -0.05158  (-0.09919)
     | > log_mle: -0.42470  (-0.42429)
     | > loss_dur: 0.37312  (0.32511)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.55048  (11.22268)
     | > current_lr: 0.00008 
     | > step_time: 0.85080  (0.76811)
     | > loader_time: 0.38740  (0.46790)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00300)
     | > avg_loss:[91m 0.27303 [0m(+0.01604)
     | > avg_log_mle:[91m -0.42235 [0m(+0.00202)
     | > avg_loss_dur:[91m 0.69539 [0m(+0.01403)


[4m[1m > EPOCH: 307/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:21:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00000)
     | > avg_loss:[92m 0.23911 [0m(-0.03392)
     | > avg_log_mle:[92m -0.42308 [0m(-0.00072)
     | > avg_loss_dur:[92m 0.66219 [0m(-0.03320)


[4m[1m > EPOCH: 308/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:21:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 5550[0m
     | > loss: -0.09521  (-0.17573)
     | > log_mle: -0.41243  (-0.43693)
     | > loss_dur: 0.31722  (0.26119)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.58707  (11.12192)
     | > current_lr: 0.00008 
     | > step_time: 0.63660  (0.66694)
     | > loader_time: 0.37930  (0.44440)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00500)
     | > avg_loss:[92m 0.22131 [0m(-0.01780)
     | > avg_log_mle:[92m -0.42812 [0m(-0.00505)
     | > avg_loss_dur:[92m 0.64944 [0m(-0.01275)


[4m[1m > EPOCH: 309/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:22:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 5575[0m
     | > loss: -0.03085  (-0.13532)
     | > log_mle: -0.42096  (-0.43094)
     | > loss_dur: 0.39011  (0.29562)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.02357  (10.46569)
     | > current_lr: 0.00008 
     | > step_time: 0.77970  (0.71927)
     | > loader_time: 0.48540  (0.45418)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[91m 0.28582 [0m(+0.06451)
     | > avg_log_mle:[91m -0.42206 [0m(+0.00606)
     | > avg_loss_dur:[91m 0.70788 [0m(+0.05845)


[4m[1m > EPOCH: 310/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:22:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00601)
     | > avg_loss:[92m 0.22858 [0m(-0.05724)
     | > avg_log_mle:[92m -0.42245 [0m(-0.00039)
     | > avg_loss_dur:[92m 0.65103 [0m(-0.05685)


[4m[1m > EPOCH: 311/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:23:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 5600[0m
     | > loss: -0.24835  (-0.25341)
     | > log_mle: -0.45610  (-0.45354)
     | > loss_dur: 0.20776  (0.20014)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.87181  (3.76680)
     | > current_lr: 0.00008 
     | > step_time: 0.55250  (0.60155)
     | > loader_time: 0.32830  (0.35632)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00000)
     | > avg_loss:[91m 0.26262 [0m(+0.03404)
     | > avg_log_mle:[92m -0.42394 [0m(-0.00150)
     | > avg_loss_dur:[91m 0.68656 [0m(+0.03553)


[4m[1m > EPOCH: 312/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:24:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 5625[0m
     | > loss: -0.12239  (-0.17028)
     | > log_mle: -0.44310  (-0.44238)
     | > loss_dur: 0.32072  (0.27210)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.45404  (10.56869)
     | > current_lr: 0.00008 
     | > step_time: 0.87180  (0.68741)
     | > loader_time: 0.56250  (0.41693)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00500)
     | > avg_loss:[91m 0.30565 [0m(+0.04303)
     | > avg_log_mle:[92m -0.42776 [0m(-0.00381)
     | > avg_loss_dur:[91m 0.73341 [0m(+0.04684)


[4m[1m > EPOCH: 313/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:24:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 5650[0m
     | > loss: -0.01902  (-0.12235)
     | > log_mle: -0.41224  (-0.43201)
     | > loss_dur: 0.39322  (0.30966)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.75299  (12.29183)
     | > current_lr: 0.00008 
     | > step_time: 0.95290  (0.76420)
     | > loader_time: 0.61760  (0.49076)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[92m 0.27014 [0m(-0.03551)
     | > avg_log_mle:[91m -0.42482 [0m(+0.00293)
     | > avg_loss_dur:[92m 0.69496 [0m(-0.03845)


[4m[1m > EPOCH: 314/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:25:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[91m 0.27898 [0m(+0.00884)
     | > avg_log_mle:[92m -0.43190 [0m(-0.00708)
     | > avg_loss_dur:[91m 0.71088 [0m(+0.01592)


[4m[1m > EPOCH: 315/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:25:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 5675[0m
     | > loss: -0.16258  (-0.20597)
     | > log_mle: -0.43716  (-0.44644)
     | > loss_dur: 0.27458  (0.24046)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.39295  (11.29938)
     | > current_lr: 0.00008 
     | > step_time: 0.73870  (0.67421)
     | > loader_time: 0.41140  (0.44140)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00400)
     | > avg_loss:[92m 0.27578 [0m(-0.00320)
     | > avg_log_mle:[91m -0.41294 [0m(+0.01896)
     | > avg_loss_dur:[92m 0.68872 [0m(-0.02216)


[4m[1m > EPOCH: 316/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:26:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 5700[0m
     | > loss: -0.07519  (-0.14957)
     | > log_mle: -0.43283  (-0.43713)
     | > loss_dur: 0.35764  (0.28756)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.77823  (11.78836)
     | > current_lr: 0.00008 
     | > step_time: 0.91380  (0.71490)
     | > loader_time: 0.64060  (0.45116)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00100)
     | > avg_loss:[92m 0.22345 [0m(-0.05233)
     | > avg_log_mle:[92m -0.42108 [0m(-0.00814)
     | > avg_loss_dur:[92m 0.64453 [0m(-0.04419)


[4m[1m > EPOCH: 317/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:26:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00000)
     | > avg_loss:[92m 0.21603 [0m(-0.00741)
     | > avg_log_mle:[92m -0.42812 [0m(-0.00704)
     | > avg_loss_dur:[92m 0.64415 [0m(-0.00038)


[4m[1m > EPOCH: 318/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:27:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 5725[0m
     | > loss: -0.23768  (-0.23768)
     | > log_mle: -0.45058  (-0.45058)
     | > loss_dur: 0.21290  (0.21290)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.41628  (6.41628)
     | > current_lr: 0.00008 
     | > step_time: 0.65360  (0.65360)
     | > loader_time: 0.38130  (0.38135)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[91m 0.24619 [0m(+0.03016)
     | > avg_log_mle:[91m -0.41980 [0m(+0.00832)
     | > avg_loss_dur:[91m 0.66599 [0m(+0.02184)


[4m[1m > EPOCH: 319/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:27:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 5750[0m
     | > loss: -0.16403  (-0.18059)
     | > log_mle: -0.45208  (-0.44650)
     | > loss_dur: 0.28805  (0.26591)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.79255  (7.12118)
     | > current_lr: 0.00008 
     | > step_time: 0.68060  (0.66736)
     | > loader_time: 0.42440  (0.41212)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00100)
     | > avg_loss:[92m 0.23529 [0m(-0.01090)
     | > avg_log_mle:[91m -0.40654 [0m(+0.01326)
     | > avg_loss_dur:[92m 0.64183 [0m(-0.02416)


[4m[1m > EPOCH: 320/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:28:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 5775[0m
     | > loss: 0.02890  (-0.10116)
     | > log_mle: -0.38809  (-0.42094)
     | > loss_dur: 0.41699  (0.31978)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.06544  (13.95732)
     | > current_lr: 0.00008 
     | > step_time: 0.87580  (0.75102)
     | > loader_time: 0.52850  (0.46515)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.01001)
     | > avg_loss:[91m 0.27712 [0m(+0.04184)
     | > avg_log_mle:[92m -0.41263 [0m(-0.00609)
     | > avg_loss_dur:[91m 0.68976 [0m(+0.04793)


[4m[1m > EPOCH: 321/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:28:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00200)
     | > avg_loss:[92m 0.24495 [0m(-0.03217)
     | > avg_log_mle:[92m -0.42581 [0m(-0.01318)
     | > avg_loss_dur:[92m 0.67076 [0m(-0.01899)


[4m[1m > EPOCH: 322/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:29:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 5800[0m
     | > loss: -0.18151  (-0.20777)
     | > log_mle: -0.44469  (-0.44733)
     | > loss_dur: 0.26318  (0.23956)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.73304  (5.79498)
     | > current_lr: 0.00008 
     | > step_time: 0.72970  (0.65935)
     | > loader_time: 0.45640  (0.39085)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[92m 0.23246 [0m(-0.01249)
     | > avg_log_mle:[92m -0.43748 [0m(-0.01167)
     | > avg_loss_dur:[92m 0.66995 [0m(-0.00082)


[4m[1m > EPOCH: 323/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:29:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 5825[0m
     | > loss: -0.15435  (-0.17350)
     | > log_mle: -0.44602  (-0.44234)
     | > loss_dur: 0.29167  (0.26884)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.17080  (14.69082)
     | > current_lr: 0.00008 
     | > step_time: 0.73670  (0.69363)
     | > loader_time: 0.41540  (0.43940)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[92m 0.22101 [0m(-0.01145)
     | > avg_log_mle:[91m -0.43314 [0m(+0.00434)
     | > avg_loss_dur:[92m 0.65415 [0m(-0.01580)


[4m[1m > EPOCH: 324/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:30:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[92m 0.21769 [0m(-0.00331)
     | > avg_log_mle:[92m -0.43459 [0m(-0.00145)
     | > avg_loss_dur:[92m 0.65228 [0m(-0.00187)


[4m[1m > EPOCH: 325/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:30:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 5850[0m
     | > loss: -0.28439  (-0.28439)
     | > log_mle: -0.46999  (-0.46999)
     | > loss_dur: 0.18560  (0.18560)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 26.19923  (26.19923)
     | > current_lr: 0.00008 
     | > step_time: 0.60660  (0.60655)
     | > loader_time: 0.26620  (0.26623)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00100)
     | > avg_loss:[91m 0.24957 [0m(+0.03187)
     | > avg_log_mle:[92m -0.43806 [0m(-0.00347)
     | > avg_loss_dur:[91m 0.68763 [0m(+0.03534)


[4m[1m > EPOCH: 326/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:31:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 5875[0m
     | > loss: -0.16593  (-0.21271)
     | > log_mle: -0.45098  (-0.45478)
     | > loss_dur: 0.28505  (0.24207)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.05800  (12.94627)
     | > current_lr: 0.00008 
     | > step_time: 0.64860  (0.66575)
     | > loader_time: 0.42440  (0.41094)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00701)
     | > avg_loss:[92m 0.24318 [0m(-0.00638)
     | > avg_log_mle:[91m -0.43802 [0m(+0.00004)
     | > avg_loss_dur:[92m 0.68121 [0m(-0.00642)


[4m[1m > EPOCH: 327/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:31:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 5900[0m
     | > loss: -0.07807  (-0.17935)
     | > log_mle: -0.42674  (-0.44826)
     | > loss_dur: 0.34867  (0.26891)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.85357  (13.50680)
     | > current_lr: 0.00008 
     | > step_time: 1.02490  (0.74368)
     | > loader_time: 0.63860  (0.47007)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00300)
     | > avg_loss:[92m 0.23864 [0m(-0.00455)
     | > avg_log_mle:[91m -0.43576 [0m(+0.00227)
     | > avg_loss_dur:[92m 0.67439 [0m(-0.00681)


[4m[1m > EPOCH: 328/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:32:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[92m 0.22284 [0m(-0.01579)
     | > avg_log_mle:[92m -0.43780 [0m(-0.00204)
     | > avg_loss_dur:[92m 0.66064 [0m(-0.01375)


[4m[1m > EPOCH: 329/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:33:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 5925[0m
     | > loss: -0.26025  (-0.27034)
     | > log_mle: -0.46558  (-0.46697)
     | > loss_dur: 0.20533  (0.19663)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.85626  (6.53700)
     | > current_lr: 0.00008 
     | > step_time: 0.67960  (0.63124)
     | > loader_time: 0.40540  (0.37868)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00100)
     | > avg_loss:[91m 0.24591 [0m(+0.02306)
     | > avg_log_mle:[91m -0.41916 [0m(+0.01864)
     | > avg_loss_dur:[91m 0.66507 [0m(+0.00443)


[4m[1m > EPOCH: 330/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:33:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 5950[0m
     | > loss: -0.13720  (-0.17273)
     | > log_mle: -0.41879  (-0.43673)
     | > loss_dur: 0.28159  (0.26400)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.92873  (14.37081)
     | > current_lr: 0.00008 
     | > step_time: 0.69860  (0.69073)
     | > loader_time: 0.41740  (0.42489)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00400)
     | > avg_loss:[91m 0.25896 [0m(+0.01305)
     | > avg_log_mle:[92m -0.42302 [0m(-0.00386)
     | > avg_loss_dur:[91m 0.68198 [0m(+0.01691)


[4m[1m > EPOCH: 331/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:34:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 5975[0m
     | > loss: -0.08214  (-0.15965)
     | > log_mle: -0.43792  (-0.44368)
     | > loss_dur: 0.35579  (0.28403)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.07610  (12.55827)
     | > current_lr: 0.00008 
     | > step_time: 0.85080  (0.76987)
     | > loader_time: 0.44540  (0.48850)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00501)
     | > avg_loss:[91m 0.26167 [0m(+0.00271)
     | > avg_log_mle:[92m -0.42400 [0m(-0.00098)
     | > avg_loss_dur:[91m 0.68567 [0m(+0.00369)


[4m[1m > EPOCH: 332/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:34:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00701)
     | > avg_loss:[91m 0.26811 [0m(+0.00644)
     | > avg_log_mle:[92m -0.43894 [0m(-0.01495)
     | > avg_loss_dur:[91m 0.70706 [0m(+0.02139)


[4m[1m > EPOCH: 333/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:35:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 6000[0m
     | > loss: -0.16655  (-0.21948)
     | > log_mle: -0.43576  (-0.45284)
     | > loss_dur: 0.26921  (0.23336)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.51858  (11.53892)
     | > current_lr: 0.00008 
     | > step_time: 0.63160  (0.66861)
     | > loader_time: 0.39240  (0.41988)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00801)
     | > avg_loss:[91m 0.26891 [0m(+0.00080)
     | > avg_log_mle:[91m -0.43578 [0m(+0.00316)
     | > avg_loss_dur:[92m 0.70469 [0m(-0.00237)


[4m[1m > EPOCH: 334/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:35:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 6025[0m
     | > loss: -0.08158  (-0.19227)
     | > log_mle: -0.43719  (-0.45256)
     | > loss_dur: 0.35561  (0.26029)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 24.39297  (12.36901)
     | > current_lr: 0.00008 
     | > step_time: 0.78470  (0.71850)
     | > loader_time: 0.48440  (0.46396)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00200)
     | > avg_loss:[91m 0.27239 [0m(+0.00348)
     | > avg_log_mle:[91m -0.43321 [0m(+0.00257)
     | > avg_loss_dur:[91m 0.70560 [0m(+0.00091)


[4m[1m > EPOCH: 335/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:36:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00601)
     | > avg_loss:[91m 0.30437 [0m(+0.03198)
     | > avg_log_mle:[91m -0.42499 [0m(+0.00822)
     | > avg_loss_dur:[91m 0.72936 [0m(+0.02376)


[4m[1m > EPOCH: 336/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:36:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 6050[0m
     | > loss: -0.28323  (-0.28205)
     | > log_mle: -0.46790  (-0.46730)
     | > loss_dur: 0.18467  (0.18525)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.37506  (7.76049)
     | > current_lr: 0.00008 
     | > step_time: 0.56350  (0.60655)
     | > loader_time: 0.34230  (0.35382)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[92m 0.26105 [0m(-0.04333)
     | > avg_log_mle:[92m -0.43452 [0m(-0.00954)
     | > avg_loss_dur:[92m 0.69557 [0m(-0.03379)


[4m[1m > EPOCH: 337/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:37:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 6075[0m
     | > loss: -0.17885  (-0.20859)
     | > log_mle: -0.45752  (-0.45424)
     | > loss_dur: 0.27867  (0.24565)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.42431  (13.63120)
     | > current_lr: 0.00008 
     | > step_time: 0.87280  (0.69074)
     | > loader_time: 0.57950  (0.43617)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00200)
     | > avg_loss:[91m 0.27706 [0m(+0.01601)
     | > avg_log_mle:[91m -0.43372 [0m(+0.00081)
     | > avg_loss_dur:[91m 0.71077 [0m(+0.01520)


[4m[1m > EPOCH: 338/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:37:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 6100[0m
     | > loss: -0.08476  (-0.18195)
     | > log_mle: -0.43114  (-0.45198)
     | > loss_dur: 0.34638  (0.27003)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.04576  (9.16127)
     | > current_lr: 0.00008 
     | > step_time: 0.95090  (0.76269)
     | > loader_time: 0.57050  (0.47230)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00100)
     | > avg_loss:[92m 0.24358 [0m(-0.03348)
     | > avg_log_mle:[92m -0.43953 [0m(-0.00581)
     | > avg_loss_dur:[92m 0.68311 [0m(-0.02766)


[4m[1m > EPOCH: 339/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:38:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00500)
     | > avg_loss:[92m 0.23773 [0m(-0.00585)
     | > avg_log_mle:[91m -0.43280 [0m(+0.00673)
     | > avg_loss_dur:[92m 0.67053 [0m(-0.01258)


[4m[1m > EPOCH: 340/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:38:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 6125[0m
     | > loss: -0.17545  (-0.23767)
     | > log_mle: -0.45091  (-0.46238)
     | > loss_dur: 0.27546  (0.22471)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.61514  (7.10182)
     | > current_lr: 0.00009 
     | > step_time: 0.73570  (0.67481)
     | > loader_time: 0.45040  (0.41918)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00400)
     | > avg_loss:[91m 0.32019 [0m(+0.08245)
     | > avg_log_mle:[91m -0.43076 [0m(+0.00204)
     | > avg_loss_dur:[91m 0.75094 [0m(+0.08041)


[4m[1m > EPOCH: 341/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:39:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 6150[0m
     | > loss: -0.09996  (-0.17587)
     | > log_mle: -0.43805  (-0.44305)
     | > loss_dur: 0.33808  (0.26718)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.69138  (11.02801)
     | > current_lr: 0.00009 
     | > step_time: 0.91180  (0.71324)
     | > loader_time: 0.64560  (0.44323)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[92m 0.31612 [0m(-0.00407)
     | > avg_log_mle:[91m -0.42047 [0m(+0.01029)
     | > avg_loss_dur:[92m 0.73658 [0m(-0.01436)


[4m[1m > EPOCH: 342/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:39:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[92m 0.23251 [0m(-0.08360)
     | > avg_log_mle:[92m -0.43844 [0m(-0.01797)
     | > avg_loss_dur:[92m 0.67095 [0m(-0.06563)


[4m[1m > EPOCH: 343/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:40:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 6175[0m
     | > loss: -0.29346  (-0.29346)
     | > log_mle: -0.47043  (-0.47043)
     | > loss_dur: 0.17696  (0.17696)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.15416  (8.15416)
     | > current_lr: 0.00009 
     | > step_time: 0.65160  (0.65159)
     | > loader_time: 0.47740  (0.47743)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00500)
     | > avg_loss:[91m 0.26525 [0m(+0.03274)
     | > avg_log_mle:[91m -0.42605 [0m(+0.01239)
     | > avg_loss_dur:[91m 0.69130 [0m(+0.02034)


[4m[1m > EPOCH: 344/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:41:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 6200[0m
     | > loss: -0.16161  (-0.21101)
     | > log_mle: -0.45841  (-0.45354)
     | > loss_dur: 0.29680  (0.24253)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.00395  (10.66868)
     | > current_lr: 0.00009 
     | > step_time: 0.68060  (0.66948)
     | > loader_time: 0.37630  (0.42501)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00701)
     | > avg_loss:[92m 0.23247 [0m(-0.03278)
     | > avg_log_mle:[92m -0.43410 [0m(-0.00805)
     | > avg_loss_dur:[92m 0.66656 [0m(-0.02473)


[4m[1m > EPOCH: 345/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:41:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 6225[0m
     | > loss: -0.12707  (-0.18220)
     | > log_mle: -0.44018  (-0.45029)
     | > loss_dur: 0.31310  (0.26808)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.52466  (13.40227)
     | > current_lr: 0.00009 
     | > step_time: 0.86880  (0.74908)
     | > loader_time: 0.52350  (0.50005)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.24793 [0m(+0.01547)
     | > avg_log_mle:[92m -0.44146 [0m(-0.00736)
     | > avg_loss_dur:[91m 0.68939 [0m(+0.02282)


[4m[1m > EPOCH: 346/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:42:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00200)
     | > avg_loss:[91m 0.25862 [0m(+0.01068)
     | > avg_log_mle:[91m -0.43965 [0m(+0.00180)
     | > avg_loss_dur:[91m 0.69827 [0m(+0.00888)


[4m[1m > EPOCH: 347/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:42:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 6250[0m
     | > loss: -0.21463  (-0.26435)
     | > log_mle: -0.45920  (-0.46683)
     | > loss_dur: 0.24457  (0.20249)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.92051  (12.74369)
     | > current_lr: 0.00009 
     | > step_time: 0.72870  (0.65935)
     | > loader_time: 0.59350  (0.42238)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[91m 0.30517 [0m(+0.04655)
     | > avg_log_mle:[91m -0.42416 [0m(+0.01549)
     | > avg_loss_dur:[91m 0.72933 [0m(+0.03106)


[4m[1m > EPOCH: 348/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:43:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 6275[0m
     | > loss: -0.19179  (-0.21062)
     | > log_mle: -0.45225  (-0.45354)
     | > loss_dur: 0.26046  (0.24292)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.28985  (9.19380)
     | > current_lr: 0.00009 
     | > step_time: 0.74070  (0.69827)
     | > loader_time: 0.46140  (0.45277)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00601)
     | > avg_loss:[92m 0.27962 [0m(-0.02554)
     | > avg_log_mle:[92m -0.44223 [0m(-0.01807)
     | > avg_loss_dur:[92m 0.72185 [0m(-0.00747)


[4m[1m > EPOCH: 349/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:43:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00100)
     | > avg_loss:[91m 0.29203 [0m(+0.01241)
     | > avg_log_mle:[91m -0.43846 [0m(+0.00377)
     | > avg_loss_dur:[91m 0.73049 [0m(+0.00864)


[4m[1m > EPOCH: 350/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:44:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 6300[0m
     | > loss: -0.29350  (-0.29350)
     | > log_mle: -0.47906  (-0.47906)
     | > loss_dur: 0.18556  (0.18556)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.44432  (9.44432)
     | > current_lr: 0.00009 
     | > step_time: 0.50050  (0.50046)
     | > loader_time: 0.28830  (0.28825)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00200)
     | > avg_loss:[92m 0.24554 [0m(-0.04649)
     | > avg_log_mle:[91m -0.42838 [0m(+0.01008)
     | > avg_loss_dur:[92m 0.67392 [0m(-0.05657)


[4m[1m > EPOCH: 351/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:44:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 6325[0m
     | > loss: -0.19173  (-0.23345)
     | > log_mle: -0.45938  (-0.45994)
     | > loss_dur: 0.26766  (0.22649)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.14826  (9.32497)
     | > current_lr: 0.00009 
     | > step_time: 0.64760  (0.66732)
     | > loader_time: 0.38940  (0.40537)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00300)
     | > avg_loss:[91m 0.25376 [0m(+0.00822)
     | > avg_log_mle:[92m -0.43170 [0m(-0.00333)
     | > avg_loss_dur:[91m 0.68546 [0m(+0.01154)


[4m[1m > EPOCH: 352/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:45:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 6350[0m
     | > loss: -0.10673  (-0.19798)
     | > log_mle: -0.43519  (-0.45502)
     | > loss_dur: 0.32846  (0.25704)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.05265  (17.77276)
     | > current_lr: 0.00009 
     | > step_time: 1.01690  (0.74182)
     | > loader_time: 0.61150  (0.47886)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00200)
     | > avg_loss:[91m 0.27408 [0m(+0.02032)
     | > avg_log_mle:[92m -0.44243 [0m(-0.01072)
     | > avg_loss_dur:[91m 0.71651 [0m(+0.03105)


[4m[1m > EPOCH: 353/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:45:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00300)
     | > avg_loss:[92m 0.25896 [0m(-0.01513)
     | > avg_log_mle:[91m -0.42839 [0m(+0.01404)
     | > avg_loss_dur:[92m 0.68735 [0m(-0.02916)


[4m[1m > EPOCH: 354/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:46:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 6375[0m
     | > loss: -0.26192  (-0.29611)
     | > log_mle: -0.46996  (-0.47749)
     | > loss_dur: 0.20803  (0.18138)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.11886  (7.89291)
     | > current_lr: 0.00009 
     | > step_time: 0.68360  (0.63425)
     | > loader_time: 0.42140  (0.36766)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00801)
     | > avg_loss:[91m 0.30097 [0m(+0.04201)
     | > avg_log_mle:[92m -0.43971 [0m(-0.01132)
     | > avg_loss_dur:[91m 0.74068 [0m(+0.05333)


[4m[1m > EPOCH: 355/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:46:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 6400[0m
     | > loss: -0.21071  (-0.23114)
     | > log_mle: -0.44142  (-0.46300)
     | > loss_dur: 0.23072  (0.23185)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.43189  (9.08655)
     | > current_lr: 0.00009 
     | > step_time: 0.69960  (0.69423)
     | > loader_time: 0.48340  (0.44140)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.26923 [0m(-0.03174)
     | > avg_log_mle:[91m -0.41646 [0m(+0.02325)
     | > avg_loss_dur:[92m 0.68569 [0m(-0.05499)


[4m[1m > EPOCH: 356/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:47:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 6425[0m
     | > loss: -0.07117  (-0.18219)
     | > log_mle: -0.43010  (-0.45008)
     | > loss_dur: 0.35893  (0.26788)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 41.18139  (12.12293)
     | > current_lr: 0.00009 
     | > step_time: 0.84880  (0.76644)
     | > loader_time: 0.41840  (0.48197)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00601)
     | > avg_loss:[91m 0.27569 [0m(+0.00646)
     | > avg_log_mle:[92m -0.42575 [0m(-0.00929)
     | > avg_loss_dur:[91m 0.70144 [0m(+0.01575)


[4m[1m > EPOCH: 357/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:47:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00601)
     | > avg_loss:[91m 0.31106 [0m(+0.03537)
     | > avg_log_mle:[92m -0.44038 [0m(-0.01463)
     | > avg_loss_dur:[91m 0.75144 [0m(+0.05000)


[4m[1m > EPOCH: 358/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:48:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 6450[0m
     | > loss: -0.16847  (-0.24997)
     | > log_mle: -0.44007  (-0.46475)
     | > loss_dur: 0.27160  (0.21478)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.52271  (13.58195)
     | > current_lr: 0.00009 
     | > step_time: 0.63760  (0.66794)
     | > loader_time: 0.38330  (0.40153)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00300)
     | > avg_loss:[91m 0.32727 [0m(+0.01621)
     | > avg_log_mle:[91m -0.44029 [0m(+0.00009)
     | > avg_loss_dur:[91m 0.76756 [0m(+0.01612)


[4m[1m > EPOCH: 359/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:49:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 6475[0m
     | > loss: -0.13421  (-0.22021)
     | > log_mle: -0.44374  (-0.46211)
     | > loss_dur: 0.30953  (0.24190)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.25364  (12.05963)
     | > current_lr: 0.00009 
     | > step_time: 0.78870  (0.72404)
     | > loader_time: 0.47840  (0.45603)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.24312 [0m(-0.08415)
     | > avg_log_mle:[92m -0.44652 [0m(-0.00623)
     | > avg_loss_dur:[92m 0.68964 [0m(-0.07792)


[4m[1m > EPOCH: 360/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:49:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[91m 0.27708 [0m(+0.03396)
     | > avg_log_mle:[91m -0.43876 [0m(+0.00776)
     | > avg_loss_dur:[91m 0.71583 [0m(+0.02620)


[4m[1m > EPOCH: 361/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:50:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 6500[0m
     | > loss: -0.31303  (-0.31904)
     | > log_mle: -0.48832  (-0.48505)
     | > loss_dur: 0.17530  (0.16601)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.54195  (8.68442)
     | > current_lr: 0.00009 
     | > step_time: 0.56450  (0.61156)
     | > loader_time: 0.35730  (0.37934)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[91m 0.31302 [0m(+0.03595)
     | > avg_log_mle:[91m -0.43302 [0m(+0.00574)
     | > avg_loss_dur:[91m 0.74604 [0m(+0.03021)


[4m[1m > EPOCH: 362/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:50:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 6525[0m
     | > loss: -0.19914  (-0.24218)
     | > log_mle: -0.46553  (-0.46672)
     | > loss_dur: 0.26639  (0.22453)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.90804  (8.12190)
     | > current_lr: 0.00009 
     | > step_time: 0.86280  (0.68985)
     | > loader_time: 0.67260  (0.46142)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00100)
     | > avg_loss:[92m 0.26455 [0m(-0.04848)
     | > avg_log_mle:[91m -0.43270 [0m(+0.00032)
     | > avg_loss_dur:[92m 0.69725 [0m(-0.04879)


[4m[1m > EPOCH: 363/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:51:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 6550[0m
     | > loss: -0.11862  (-0.19749)
     | > log_mle: -0.43737  (-0.45617)
     | > loss_dur: 0.31875  (0.25868)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.47024  (11.34568)
     | > current_lr: 0.00009 
     | > step_time: 0.95890  (0.76902)
     | > loader_time: 0.63260  (0.51884)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00601)
     | > avg_loss:[91m 0.28000 [0m(+0.01545)
     | > avg_log_mle:[92m -0.43654 [0m(-0.00384)
     | > avg_loss_dur:[91m 0.71654 [0m(+0.01929)


[4m[1m > EPOCH: 364/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:51:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00701)
     | > avg_loss:[91m 0.29099 [0m(+0.01099)
     | > avg_log_mle:[92m -0.44676 [0m(-0.01022)
     | > avg_loss_dur:[91m 0.73775 [0m(+0.02121)


[4m[1m > EPOCH: 365/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:52:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 6575[0m
     | > loss: -0.19031  (-0.26430)
     | > log_mle: -0.45665  (-0.47233)
     | > loss_dur: 0.26634  (0.20803)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.65136  (7.15976)
     | > current_lr: 0.00009 
     | > step_time: 0.74170  (0.67241)
     | > loader_time: 0.47640  (0.44981)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00100)
     | > avg_loss:[92m 0.28990 [0m(-0.00108)
     | > avg_log_mle:[91m -0.43617 [0m(+0.01059)
     | > avg_loss_dur:[92m 0.72608 [0m(-0.01168)


[4m[1m > EPOCH: 366/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:52:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 6600[0m
     | > loss: -0.16358  (-0.23320)
     | > log_mle: -0.45778  (-0.46665)
     | > loss_dur: 0.29419  (0.23345)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.31145  (10.43084)
     | > current_lr: 0.00009 
     | > step_time: 0.91280  (0.71682)
     | > loader_time: 0.62460  (0.46033)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[92m 0.27660 [0m(-0.01331)
     | > avg_log_mle:[92m -0.44891 [0m(-0.01274)
     | > avg_loss_dur:[92m 0.72551 [0m(-0.00057)


[4m[1m > EPOCH: 367/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:53:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00300)
     | > avg_loss:[91m 0.28504 [0m(+0.00845)
     | > avg_log_mle:[91m -0.44817 [0m(+0.00074)
     | > avg_loss_dur:[91m 0.73321 [0m(+0.00770)


[4m[1m > EPOCH: 368/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:53:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 6625[0m
     | > loss: -0.32319  (-0.32319)
     | > log_mle: -0.48929  (-0.48929)
     | > loss_dur: 0.16609  (0.16609)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.44145  (5.44145)
     | > current_lr: 0.00009 
     | > step_time: 0.64860  (0.64859)
     | > loader_time: 0.39040  (0.39035)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00901)
     | > avg_loss:[92m 0.26110 [0m(-0.02394)
     | > avg_log_mle:[91m -0.44777 [0m(+0.00041)
     | > avg_loss_dur:[92m 0.70887 [0m(-0.02435)


[4m[1m > EPOCH: 369/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:54:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 6650[0m
     | > loss: -0.22093  (-0.26129)
     | > log_mle: -0.48113  (-0.47859)
     | > loss_dur: 0.26020  (0.21730)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.21652  (14.42297)
     | > current_lr: 0.00009 
     | > step_time: 0.68360  (0.66836)
     | > loader_time: 0.42540  (0.40775)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00400)
     | > avg_loss:[91m 0.27682 [0m(+0.01572)
     | > avg_log_mle:[91m -0.44451 [0m(+0.00326)
     | > avg_loss_dur:[91m 0.72132 [0m(+0.01245)


[4m[1m > EPOCH: 370/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:54:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 6675[0m
     | > loss: -0.13027  (-0.20352)
     | > log_mle: -0.44173  (-0.46018)
     | > loss_dur: 0.31146  (0.25666)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.23314  (13.44846)
     | > current_lr: 0.00009 
     | > step_time: 0.87780  (0.75249)
     | > loader_time: 0.53850  (0.48437)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[91m 0.32244 [0m(+0.04562)
     | > avg_log_mle:[91m -0.44223 [0m(+0.00227)
     | > avg_loss_dur:[91m 0.76468 [0m(+0.04335)


[4m[1m > EPOCH: 371/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:55:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00701)
     | > avg_loss:[92m 0.25024 [0m(-0.07220)
     | > avg_log_mle:[92m -0.44261 [0m(-0.00038)
     | > avg_loss_dur:[92m 0.69285 [0m(-0.07183)


[4m[1m > EPOCH: 372/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:55:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 6700[0m
     | > loss: -0.24542  (-0.30107)
     | > log_mle: -0.46703  (-0.48451)
     | > loss_dur: 0.22161  (0.18344)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.25175  (10.10456)
     | > current_lr: 0.00009 
     | > step_time: 0.73070  (0.65835)
     | > loader_time: 0.50750  (0.43264)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01201)
     | > avg_loss:[91m 0.29655 [0m(+0.04631)
     | > avg_log_mle:[92m -0.44792 [0m(-0.00531)
     | > avg_loss_dur:[91m 0.74447 [0m(+0.05162)


[4m[1m > EPOCH: 373/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:56:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 6725[0m
     | > loss: -0.21610  (-0.25176)
     | > log_mle: -0.46867  (-0.47470)
     | > loss_dur: 0.25257  (0.22295)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.76487  (14.17577)
     | > current_lr: 0.00009 
     | > step_time: 0.73770  (0.69582)
     | > loader_time: 0.45140  (0.46551)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00801)
     | > avg_loss:[92m 0.25085 [0m(-0.04569)
     | > avg_log_mle:[92m -0.44810 [0m(-0.00018)
     | > avg_loss_dur:[92m 0.69895 [0m(-0.04552)


[4m[1m > EPOCH: 374/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:57:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00000)
     | > avg_loss:[91m 0.28845 [0m(+0.03760)
     | > avg_log_mle:[91m -0.44317 [0m(+0.00493)
     | > avg_loss_dur:[91m 0.73162 [0m(+0.03267)


[4m[1m > EPOCH: 375/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:57:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 6750[0m
     | > loss: -0.34967  (-0.34967)
     | > log_mle: -0.49949  (-0.49949)
     | > loss_dur: 0.14982  (0.14982)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.92248  (18.92248)
     | > current_lr: 0.00009 
     | > step_time: 0.66560  (0.66561)
     | > loader_time: 0.26820  (0.26824)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.26891 [0m(-0.01954)
     | > avg_log_mle:[92m -0.45175 [0m(-0.00857)
     | > avg_loss_dur:[92m 0.72066 [0m(-0.01097)


[4m[1m > EPOCH: 376/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:58:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 6775[0m
     | > loss: -0.21140  (-0.26830)
     | > log_mle: -0.46311  (-0.47612)
     | > loss_dur: 0.25171  (0.20783)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 30.13211  (16.35290)
     | > current_lr: 0.00009 
     | > step_time: 0.64660  (0.66189)
     | > loader_time: 0.38940  (0.39193)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00701)
     | > avg_loss:[91m 0.31669 [0m(+0.04777)
     | > avg_log_mle:[91m -0.42871 [0m(+0.02303)
     | > avg_loss_dur:[91m 0.74540 [0m(+0.02474)


[4m[1m > EPOCH: 377/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:58:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 6800[0m
     | > loss: -0.13135  (-0.22695)
     | > log_mle: -0.43919  (-0.46533)
     | > loss_dur: 0.30784  (0.23838)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.80689  (9.94883)
     | > current_lr: 0.00009 
     | > step_time: 1.01990  (0.74060)
     | > loader_time: 0.61660  (0.47407)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00400)
     | > avg_loss:[91m 0.32289 [0m(+0.00620)
     | > avg_log_mle:[92m -0.44277 [0m(-0.01406)
     | > avg_loss_dur:[91m 0.76566 [0m(+0.02026)


[4m[1m > EPOCH: 378/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:59:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[92m 0.26195 [0m(-0.06094)
     | > avg_log_mle:[92m -0.44755 [0m(-0.00478)
     | > avg_loss_dur:[92m 0.70949 [0m(-0.05616)


[4m[1m > EPOCH: 379/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 07:59:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 6825[0m
     | > loss: -0.30907  (-0.32957)
     | > log_mle: -0.49464  (-0.49455)
     | > loss_dur: 0.18557  (0.16498)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.15681  (7.42627)
     | > current_lr: 0.00009 
     | > step_time: 0.68960  (0.63391)
     | > loader_time: 0.41140  (0.38969)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[91m 0.27048 [0m(+0.00853)
     | > avg_log_mle:[91m -0.43198 [0m(+0.01557)
     | > avg_loss_dur:[92m 0.70246 [0m(-0.00704)


[4m[1m > EPOCH: 380/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:00:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 6850[0m
     | > loss: -0.21065  (-0.25334)
     | > log_mle: -0.44931  (-0.47186)
     | > loss_dur: 0.23865  (0.21853)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.54489  (7.07868)
     | > current_lr: 0.00010 
     | > step_time: 0.69960  (0.68933)
     | > loader_time: 0.44540  (0.42439)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[92m 0.22796 [0m(-0.04252)
     | > avg_log_mle:[92m -0.44526 [0m(-0.01328)
     | > avg_loss_dur:[92m 0.67322 [0m(-0.02924)


[4m[1m > EPOCH: 381/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:00:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 6875[0m
     | > loss: -0.16041  (-0.22008)
     | > log_mle: -0.45554  (-0.46531)
     | > loss_dur: 0.29513  (0.24523)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.95088  (11.51970)
     | > current_lr: 0.00010 
     | > step_time: 0.84480  (0.76799)
     | > loader_time: 0.43340  (0.49368)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00901)
     | > avg_loss:[91m 0.27858 [0m(+0.05062)
     | > avg_log_mle:[92m -0.44983 [0m(-0.00457)
     | > avg_loss_dur:[91m 0.72841 [0m(+0.05519)


[4m[1m > EPOCH: 382/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:01:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00901)
     | > avg_loss:[92m 0.25096 [0m(-0.02762)
     | > avg_log_mle:[91m -0.43280 [0m(+0.01703)
     | > avg_loss_dur:[92m 0.68377 [0m(-0.04465)


[4m[1m > EPOCH: 383/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:01:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 6900[0m
     | > loss: -0.20980  (-0.27876)
     | > log_mle: -0.46116  (-0.48268)
     | > loss_dur: 0.25136  (0.20391)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 28.35245  (21.30995)
     | > current_lr: 0.00010 
     | > step_time: 0.63960  (0.66978)
     | > loader_time: 0.41940  (0.41738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00500)
     | > avg_loss:[92m 0.24279 [0m(-0.00818)
     | > avg_log_mle:[92m -0.45041 [0m(-0.01761)
     | > avg_loss_dur:[91m 0.69320 [0m(+0.00944)


[4m[1m > EPOCH: 384/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:02:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 6925[0m
     | > loss: -0.19114  (-0.25636)
     | > log_mle: -0.46220  (-0.48025)
     | > loss_dur: 0.27106  (0.22389)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 28.72013  (13.04135)
     | > current_lr: 0.00010 
     | > step_time: 0.78570  (0.71966)
     | > loader_time: 0.48240  (0.45972)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00100)
     | > avg_loss:[91m 0.24994 [0m(+0.00715)
     | > avg_log_mle:[91m -0.44793 [0m(+0.00248)
     | > avg_loss_dur:[91m 0.69787 [0m(+0.00466)


[4m[1m > EPOCH: 385/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:02:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00501)
     | > avg_loss:[91m 0.28788 [0m(+0.03795)
     | > avg_log_mle:[92m -0.44983 [0m(-0.00190)
     | > avg_loss_dur:[91m 0.73772 [0m(+0.03985)


[4m[1m > EPOCH: 386/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:03:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 6950[0m
     | > loss: -0.32395  (-0.34108)
     | > log_mle: -0.49026  (-0.49470)
     | > loss_dur: 0.16631  (0.15362)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.19086  (16.59582)
     | > current_lr: 0.00010 
     | > step_time: 0.56450  (0.61006)
     | > loader_time: 0.33830  (0.34131)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00300)
     | > avg_loss:[91m 0.30662 [0m(+0.01874)
     | > avg_log_mle:[91m -0.43128 [0m(+0.01855)
     | > avg_loss_dur:[91m 0.73791 [0m(+0.00019)


[4m[1m > EPOCH: 387/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:03:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 6975[0m
     | > loss: -0.21846  (-0.26240)
     | > log_mle: -0.46935  (-0.47480)
     | > loss_dur: 0.25090  (0.21240)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 34.98870  (16.96942)
     | > current_lr: 0.00010 
     | > step_time: 0.87480  (0.69107)
     | > loader_time: 0.58750  (0.43039)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[92m 0.25947 [0m(-0.04716)
     | > avg_log_mle:[91m -0.43015 [0m(+0.00113)
     | > avg_loss_dur:[92m 0.68962 [0m(-0.04829)


[4m[1m > EPOCH: 388/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:04:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 7000[0m
     | > loss: -0.17111  (-0.22861)
     | > log_mle: -0.45167  (-0.46863)
     | > loss_dur: 0.28057  (0.24002)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.51612  (11.37229)
     | > current_lr: 0.00010 
     | > step_time: 0.94890  (0.76182)
     | > loader_time: 0.60760  (0.49689)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00200)
     | > avg_loss:[92m 0.25180 [0m(-0.00766)
     | > avg_log_mle:[92m -0.44901 [0m(-0.01886)
     | > avg_loss_dur:[91m 0.70082 [0m(+0.01120)


[4m[1m > EPOCH: 389/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:05:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00400)
     | > avg_loss:[91m 0.30245 [0m(+0.05065)
     | > avg_log_mle:[92m -0.45150 [0m(-0.00249)
     | > avg_loss_dur:[91m 0.75395 [0m(+0.05314)


[4m[1m > EPOCH: 390/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:05:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 7025[0m
     | > loss: -0.27891  (-0.32520)
     | > log_mle: -0.48340  (-0.49758)
     | > loss_dur: 0.20449  (0.17238)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.36677  (7.86568)
     | > current_lr: 0.00010 
     | > step_time: 0.74470  (0.67441)
     | > loader_time: 0.44240  (0.41257)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[91m 0.32922 [0m(+0.02677)
     | > avg_log_mle:[91m -0.44250 [0m(+0.00900)
     | > avg_loss_dur:[91m 0.77172 [0m(+0.01777)


[4m[1m > EPOCH: 391/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:06:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 7050[0m
     | > loss: -0.20555  (-0.27428)
     | > log_mle: -0.47223  (-0.48294)
     | > loss_dur: 0.26668  (0.20866)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 24.73377  (11.16645)
     | > current_lr: 0.00010 
     | > step_time: 0.91380  (0.71198)
     | > loader_time: 0.62560  (0.44832)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00400)
     | > avg_loss:[92m 0.27461 [0m(-0.05461)
     | > avg_log_mle:[92m -0.44582 [0m(-0.00332)
     | > avg_loss_dur:[92m 0.72043 [0m(-0.05129)


[4m[1m > EPOCH: 392/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:06:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06306 [0m(+0.00100)
     | > avg_loss:[91m 0.30344 [0m(+0.02882)
     | > avg_log_mle:[91m -0.42594 [0m(+0.01988)
     | > avg_loss_dur:[91m 0.72938 [0m(+0.00894)


[4m[1m > EPOCH: 393/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:07:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 7075[0m
     | > loss: -0.36809  (-0.36809)
     | > log_mle: -0.50095  (-0.50095)
     | > loss_dur: 0.13286  (0.13286)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 32.18478  (32.18478)
     | > current_lr: 0.00010 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.38940  (0.38935)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01501)
     | > avg_loss:[91m 0.35624 [0m(+0.05281)
     | > avg_log_mle:[92m -0.42899 [0m(-0.00305)
     | > avg_loss_dur:[91m 0.78523 [0m(+0.05585)


[4m[1m > EPOCH: 394/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:07:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 7100[0m
     | > loss: -0.25217  (-0.28436)
     | > log_mle: -0.48642  (-0.48490)
     | > loss_dur: 0.23425  (0.20054)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.84664  (12.79391)
     | > current_lr: 0.00010 
     | > step_time: 0.67660  (0.66786)
     | > loader_time: 0.38030  (0.40287)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01101)
     | > avg_loss:[92m 0.31193 [0m(-0.04431)
     | > avg_log_mle:[92m -0.44864 [0m(-0.01965)
     | > avg_loss_dur:[92m 0.76057 [0m(-0.02466)


[4m[1m > EPOCH: 395/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:08:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 7125[0m
     | > loss: -0.19744  (-0.24877)
     | > log_mle: -0.46185  (-0.47847)
     | > loss_dur: 0.26440  (0.22970)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.60569  (11.09057)
     | > current_lr: 0.00010 
     | > step_time: 0.87280  (0.74935)
     | > loader_time: 0.58450  (0.47096)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[91m 0.31836 [0m(+0.00643)
     | > avg_log_mle:[92m -0.45298 [0m(-0.00434)
     | > avg_loss_dur:[91m 0.77134 [0m(+0.01078)


[4m[1m > EPOCH: 396/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:08:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[92m 0.29465 [0m(-0.02371)
     | > avg_log_mle:[91m -0.44295 [0m(+0.01004)
     | > avg_loss_dur:[92m 0.73760 [0m(-0.03375)


[4m[1m > EPOCH: 397/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:09:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 7150[0m
     | > loss: -0.28296  (-0.33528)
     | > log_mle: -0.48869  (-0.50162)
     | > loss_dur: 0.20573  (0.16634)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.98257  (12.42870)
     | > current_lr: 0.00010 
     | > step_time: 0.72770  (0.65860)
     | > loader_time: 0.58750  (0.43289)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00400)
     | > avg_loss:[92m 0.27217 [0m(-0.02249)
     | > avg_log_mle:[91m -0.41381 [0m(+0.02913)
     | > avg_loss_dur:[92m 0.68598 [0m(-0.05162)


[4m[1m > EPOCH: 398/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:09:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 7175[0m
     | > loss: -0.25016  (-0.26819)
     | > log_mle: -0.47048  (-0.47544)
     | > loss_dur: 0.22031  (0.20725)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.02940  (12.27385)
     | > current_lr: 0.00010 
     | > step_time: 0.74070  (0.69736)
     | > loader_time: 0.50050  (0.44049)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[91m 0.31517 [0m(+0.04300)
     | > avg_log_mle:[92m -0.43311 [0m(-0.01929)
     | > avg_loss_dur:[91m 0.74828 [0m(+0.06230)


[4m[1m > EPOCH: 399/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:10:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00801)
     | > avg_loss:[92m 0.28436 [0m(-0.03081)
     | > avg_log_mle:[92m -0.44994 [0m(-0.01684)
     | > avg_loss_dur:[92m 0.73430 [0m(-0.01398)


[4m[1m > EPOCH: 400/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:10:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 7200[0m
     | > loss: -0.34904  (-0.34904)
     | > log_mle: -0.50999  (-0.50999)
     | > loss_dur: 0.16095  (0.16095)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.93573  (8.93573)
     | > current_lr: 0.00010 
     | > step_time: 0.50050  (0.50046)
     | > loader_time: 0.28520  (0.28525)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00300)
     | > avg_loss:[91m 0.28839 [0m(+0.00403)
     | > avg_log_mle:[92m -0.45277 [0m(-0.00283)
     | > avg_loss_dur:[91m 0.74116 [0m(+0.00686)


[4m[1m > EPOCH: 401/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:11:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 7225[0m
     | > loss: -0.25431  (-0.31274)
     | > log_mle: -0.49068  (-0.49839)
     | > loss_dur: 0.23637  (0.18566)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.05872  (14.52972)
     | > current_lr: 0.00010 
     | > step_time: 0.64560  (0.66561)
     | > loader_time: 0.40840  (0.41195)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[92m 0.27569 [0m(-0.01270)
     | > avg_log_mle:[92m -0.45385 [0m(-0.00108)
     | > avg_loss_dur:[92m 0.72954 [0m(-0.01162)


[4m[1m > EPOCH: 402/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:11:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 7250[0m
     | > loss: -0.20061  (-0.27573)
     | > log_mle: -0.46107  (-0.48930)
     | > loss_dur: 0.26046  (0.21357)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.23166  (15.10576)
     | > current_lr: 0.00010 
     | > step_time: 1.02690  (0.74010)
     | > loader_time: 0.61060  (0.47229)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.00300)
     | > avg_loss:[91m 0.31238 [0m(+0.03668)
     | > avg_log_mle:[91m -0.44902 [0m(+0.00483)
     | > avg_loss_dur:[91m 0.76139 [0m(+0.03185)


[4m[1m > EPOCH: 403/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:12:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00901)
     | > avg_loss:[92m 0.24419 [0m(-0.06819)
     | > avg_log_mle:[92m -0.45269 [0m(-0.00367)
     | > avg_loss_dur:[92m 0.69688 [0m(-0.06452)


[4m[1m > EPOCH: 404/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:12:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 7275[0m
     | > loss: -0.35775  (-0.37319)
     | > log_mle: -0.51140  (-0.51563)
     | > loss_dur: 0.15365  (0.14244)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.34357  (9.30644)
     | > current_lr: 0.00010 
     | > step_time: 0.68760  (0.63424)
     | > loader_time: 0.41940  (0.44273)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[91m 0.31899 [0m(+0.07481)
     | > avg_log_mle:[91m -0.44753 [0m(+0.00516)
     | > avg_loss_dur:[91m 0.76652 [0m(+0.06965)


[4m[1m > EPOCH: 405/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:13:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 7300[0m
     | > loss: -0.26385  (-0.30072)
     | > log_mle: -0.47030  (-0.49424)
     | > loss_dur: 0.20644  (0.19352)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.76749  (13.19964)
     | > current_lr: 0.00010 
     | > step_time: 0.70370  (0.69413)
     | > loader_time: 0.45040  (0.43730)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[92m 0.25847 [0m(-0.06053)
     | > avg_log_mle:[91m -0.44466 [0m(+0.00287)
     | > avg_loss_dur:[92m 0.70313 [0m(-0.06340)


[4m[1m > EPOCH: 406/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:13:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 7325[0m
     | > loss: -0.20328  (-0.26696)
     | > log_mle: -0.46982  (-0.48464)
     | > loss_dur: 0.26653  (0.21769)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.57192  (10.75111)
     | > current_lr: 0.00010 
     | > step_time: 0.84780  (0.76695)
     | > loader_time: 0.45840  (0.47260)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00000)
     | > avg_loss:[91m 0.30470 [0m(+0.04623)
     | > avg_log_mle:[92m -0.45564 [0m(-0.01098)
     | > avg_loss_dur:[91m 0.76034 [0m(+0.05721)


[4m[1m > EPOCH: 407/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:14:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00500)
     | > avg_loss:[92m 0.29819 [0m(-0.00650)
     | > avg_log_mle:[91m -0.41788 [0m(+0.03777)
     | > avg_loss_dur:[92m 0.71607 [0m(-0.04427)


[4m[1m > EPOCH: 408/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:15:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 7350[0m
     | > loss: -0.25261  (-0.30124)
     | > log_mle: -0.46611  (-0.48570)
     | > loss_dur: 0.21351  (0.18446)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.30452  (10.08405)
     | > current_lr: 0.00010 
     | > step_time: 0.63760  (0.66661)
     | > loader_time: 0.37230  (0.40253)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00400)
     | > avg_loss:[92m 0.29402 [0m(-0.00418)
     | > avg_log_mle:[92m -0.44345 [0m(-0.02557)
     | > avg_loss_dur:[91m 0.73746 [0m(+0.02139)


[4m[1m > EPOCH: 409/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:15:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 7375[0m
     | > loss: -0.18336  (-0.27489)
     | > log_mle: -0.46777  (-0.48563)
     | > loss_dur: 0.28441  (0.21075)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.07073  (13.23125)
     | > current_lr: 0.00010 
     | > step_time: 0.78870  (0.72196)
     | > loader_time: 0.50950  (0.46126)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[92m 0.27690 [0m(-0.01711)
     | > avg_log_mle:[91m -0.44288 [0m(+0.00056)
     | > avg_loss_dur:[92m 0.71979 [0m(-0.01768)


[4m[1m > EPOCH: 410/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:16:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[91m 0.33005 [0m(+0.05314)
     | > avg_log_mle:[92m -0.44623 [0m(-0.00335)
     | > avg_loss_dur:[91m 0.77628 [0m(+0.05649)


[4m[1m > EPOCH: 411/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:16:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 7400[0m
     | > loss: -0.35118  (-0.35300)
     | > log_mle: -0.50716  (-0.50377)
     | > loss_dur: 0.15597  (0.15077)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.45401  (6.57639)
     | > current_lr: 0.00010 
     | > step_time: 0.56350  (0.60405)
     | > loader_time: 0.35830  (0.36333)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[91m 0.34506 [0m(+0.01501)
     | > avg_log_mle:[91m -0.43671 [0m(+0.00952)
     | > avg_loss_dur:[91m 0.78177 [0m(+0.00549)


[4m[1m > EPOCH: 412/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:17:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 7425[0m
     | > loss: -0.22392  (-0.28392)
     | > log_mle: -0.48179  (-0.48941)
     | > loss_dur: 0.25787  (0.20549)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.37469  (14.17702)
     | > current_lr: 0.00010 
     | > step_time: 0.87980  (0.69052)
     | > loader_time: 0.61560  (0.43339)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00500)
     | > avg_loss:[92m 0.27768 [0m(-0.06738)
     | > avg_log_mle:[92m -0.44955 [0m(-0.01285)
     | > avg_loss_dur:[92m 0.72723 [0m(-0.05454)


[4m[1m > EPOCH: 413/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:17:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 7450[0m
     | > loss: -0.19691  (-0.26759)
     | > log_mle: -0.46323  (-0.48650)
     | > loss_dur: 0.26631  (0.21891)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.78950  (10.46800)
     | > current_lr: 0.00010 
     | > step_time: 0.95590  (0.76188)
     | > loader_time: 0.57550  (0.46961)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00500)
     | > avg_loss:[92m 0.27200 [0m(-0.00568)
     | > avg_log_mle:[91m -0.44236 [0m(+0.00719)
     | > avg_loss_dur:[92m 0.71436 [0m(-0.01287)


[4m[1m > EPOCH: 414/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:18:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00801)
     | > avg_loss:[91m 0.30807 [0m(+0.03607)
     | > avg_log_mle:[92m -0.44959 [0m(-0.00722)
     | > avg_loss_dur:[91m 0.75765 [0m(+0.04329)


[4m[1m > EPOCH: 415/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:18:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 7475[0m
     | > loss: -0.28766  (-0.34380)
     | > log_mle: -0.49370  (-0.50797)
     | > loss_dur: 0.20603  (0.16417)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.36783  (11.64986)
     | > current_lr: 0.00010 
     | > step_time: 0.74570  (0.67261)
     | > loader_time: 0.45740  (0.41958)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00501)
     | > avg_loss:[91m 0.34100 [0m(+0.03293)
     | > avg_log_mle:[92m -0.45342 [0m(-0.00383)
     | > avg_loss_dur:[91m 0.79442 [0m(+0.03676)


[4m[1m > EPOCH: 416/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:19:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 7500[0m
     | > loss: -0.25252  (-0.30697)
     | > log_mle: -0.48692  (-0.49847)
     | > loss_dur: 0.23439  (0.19151)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.14025  (11.55149)
     | > current_lr: 0.00010 
     | > step_time: 0.91680  (0.71448)
     | > loader_time: 0.61960  (0.45633)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[92m 0.30484 [0m(-0.03615)
     | > avg_log_mle:[92m -0.45736 [0m(-0.00394)
     | > avg_loss_dur:[92m 0.76220 [0m(-0.03222)


[4m[1m > EPOCH: 417/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:19:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[92m 0.29670 [0m(-0.00815)
     | > avg_log_mle:[91m -0.45505 [0m(+0.00231)
     | > avg_loss_dur:[92m 0.75175 [0m(-0.01045)


[4m[1m > EPOCH: 418/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:20:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 7525[0m
     | > loss: -0.38479  (-0.38479)
     | > log_mle: -0.52095  (-0.52095)
     | > loss_dur: 0.13616  (0.13616)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.08042  (10.08042)
     | > current_lr: 0.00010 
     | > step_time: 0.65060  (0.65059)
     | > loader_time: 0.39940  (0.39936)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00600)
     | > avg_loss:[91m 0.32797 [0m(+0.03127)
     | > avg_log_mle:[91m -0.43464 [0m(+0.02041)
     | > avg_loss_dur:[91m 0.76261 [0m(+0.01086)


[4m[1m > EPOCH: 419/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:20:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 7550[0m
     | > loss: -0.27725  (-0.30691)
     | > log_mle: -0.49774  (-0.49519)
     | > loss_dur: 0.22048  (0.18829)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.48517  (11.92048)
     | > current_lr: 0.00010 
     | > step_time: 0.67760  (0.66573)
     | > loader_time: 0.42440  (0.41100)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00701)
     | > avg_loss:[92m 0.29830 [0m(-0.02967)
     | > avg_log_mle:[92m -0.44889 [0m(-0.01425)
     | > avg_loss_dur:[92m 0.74719 [0m(-0.01542)


[4m[1m > EPOCH: 420/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:21:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 7575[0m
     | > loss: -0.17905  (-0.26474)
     | > log_mle: -0.46743  (-0.48619)
     | > loss_dur: 0.28838  (0.22144)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.46529  (10.70234)
     | > current_lr: 0.00011 
     | > step_time: 0.88280  (0.75048)
     | > loader_time: 0.55650  (0.47470)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00400)
     | > avg_loss:[92m 0.25461 [0m(-0.04369)
     | > avg_log_mle:[92m -0.45187 [0m(-0.00298)
     | > avg_loss_dur:[92m 0.70648 [0m(-0.04071)


[4m[1m > EPOCH: 421/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:21:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00801)
     | > avg_loss:[91m 0.30189 [0m(+0.04728)
     | > avg_log_mle:[91m -0.43330 [0m(+0.01856)
     | > avg_loss_dur:[91m 0.73520 [0m(+0.02872)


[4m[1m > EPOCH: 422/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:22:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 7600[0m
     | > loss: -0.29362  (-0.34692)
     | > log_mle: -0.49584  (-0.51039)
     | > loss_dur: 0.20223  (0.16347)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.79509  (8.59628)
     | > current_lr: 0.00011 
     | > step_time: 0.73270  (0.65810)
     | > loader_time: 0.48140  (0.39561)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00600)
     | > avg_loss:[91m 0.32446 [0m(+0.02257)
     | > avg_log_mle:[92m -0.45088 [0m(-0.01758)
     | > avg_loss_dur:[91m 0.77534 [0m(+0.04014)


[4m[1m > EPOCH: 423/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:22:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 7625[0m
     | > loss: -0.29641  (-0.29984)
     | > log_mle: -0.49575  (-0.49810)
     | > loss_dur: 0.19934  (0.19826)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.90878  (14.62297)
     | > current_lr: 0.00011 
     | > step_time: 0.73570  (0.69600)
     | > loader_time: 0.48140  (0.44850)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[92m 0.21511 [0m(-0.10935)
     | > avg_log_mle:[92m -0.45813 [0m(-0.00725)
     | > avg_loss_dur:[92m 0.67324 [0m(-0.10210)


[4m[1m > EPOCH: 424/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:23:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00601)
     | > avg_loss:[91m 0.32641 [0m(+0.11130)
     | > avg_log_mle:[91m -0.45133 [0m(+0.00681)
     | > avg_loss_dur:[91m 0.77774 [0m(+0.10450)


[4m[1m > EPOCH: 425/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:23:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 7650[0m
     | > loss: -0.40386  (-0.40386)
     | > log_mle: -0.53148  (-0.53148)
     | > loss_dur: 0.12762  (0.12762)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 28.59150  (28.59150)
     | > current_lr: 0.00011 
     | > step_time: 0.68060  (0.68062)
     | > loader_time: 0.28830  (0.28826)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.34315 [0m(+0.01673)
     | > avg_log_mle:[91m -0.42815 [0m(+0.02317)
     | > avg_loss_dur:[92m 0.77130 [0m(-0.00644)


[4m[1m > EPOCH: 426/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:24:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 7675[0m
     | > loss: -0.28149  (-0.32314)
     | > log_mle: -0.49281  (-0.50022)
     | > loss_dur: 0.21133  (0.17708)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.22948  (10.10986)
     | > current_lr: 0.00011 
     | > step_time: 0.64960  (0.66532)
     | > loader_time: 0.41840  (0.41352)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00601)
     | > avg_loss:[92m 0.29599 [0m(-0.04716)
     | > avg_log_mle:[92m -0.45314 [0m(-0.02498)
     | > avg_loss_dur:[92m 0.74912 [0m(-0.02218)


[4m[1m > EPOCH: 427/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:25:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 7700[0m
     | > loss: -0.23774  (-0.29844)
     | > log_mle: -0.47360  (-0.49721)
     | > loss_dur: 0.23586  (0.19877)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.47337  (13.06787)
     | > current_lr: 0.00011 
     | > step_time: 1.02490  (0.74375)
     | > loader_time: 0.60960  (0.47150)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00500)
     | > avg_loss:[92m 0.27968 [0m(-0.01631)
     | > avg_log_mle:[92m -0.45948 [0m(-0.00635)
     | > avg_loss_dur:[92m 0.73916 [0m(-0.00996)


[4m[1m > EPOCH: 428/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:25:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00501)
     | > avg_loss:[91m 0.32530 [0m(+0.04562)
     | > avg_log_mle:[91m -0.45536 [0m(+0.00413)
     | > avg_loss_dur:[91m 0.78066 [0m(+0.04150)


[4m[1m > EPOCH: 429/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:26:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 7725[0m
     | > loss: -0.37225  (-0.39174)
     | > log_mle: -0.52408  (-0.53034)
     | > loss_dur: 0.15184  (0.13860)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.63261  (11.22997)
     | > current_lr: 0.00011 
     | > step_time: 0.68660  (0.63291)
     | > loader_time: 0.39440  (0.36533)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06505 [0m(-0.01002)
     | > avg_loss:[91m 0.35315 [0m(+0.02785)
     | > avg_log_mle:[91m -0.45269 [0m(+0.00267)
     | > avg_loss_dur:[91m 0.80584 [0m(+0.02518)


[4m[1m > EPOCH: 430/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:26:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 7750[0m
     | > loss: -0.29212  (-0.32325)
     | > log_mle: -0.48041  (-0.50802)
     | > loss_dur: 0.18829  (0.18477)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.97865  (10.53941)
     | > current_lr: 0.00011 
     | > step_time: 0.70360  (0.69123)
     | > loader_time: 0.42640  (0.44440)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00101)
     | > avg_loss:[92m 0.33436 [0m(-0.01879)
     | > avg_log_mle:[91m -0.45096 [0m(+0.00173)
     | > avg_loss_dur:[92m 0.78532 [0m(-0.02052)


[4m[1m > EPOCH: 431/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:27:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 7775[0m
     | > loss: -0.21989  (-0.26717)
     | > log_mle: -0.47242  (-0.48420)
     | > loss_dur: 0.25253  (0.21703)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.66039  (13.56351)
     | > current_lr: 0.00011 
     | > step_time: 0.85580  (0.77376)
     | > loader_time: 0.45340  (0.47979)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.06606 [0m(+0.00000)
     | > avg_loss:[92m 0.25988 [0m(-0.07448)
     | > avg_log_mle:[92m -0.45352 [0m(-0.00256)
     | > avg_loss_dur:[92m 0.71340 [0m(-0.07192)


[4m[1m > EPOCH: 432/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:27:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00601)
     | > avg_loss:[91m 0.36230 [0m(+0.10242)
     | > avg_log_mle:[91m -0.44007 [0m(+0.01345)
     | > avg_loss_dur:[91m 0.80237 [0m(+0.08897)


[4m[1m > EPOCH: 433/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:28:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 7800[0m
     | > loss: -0.25549  (-0.32492)
     | > log_mle: -0.47362  (-0.50194)
     | > loss_dur: 0.21814  (0.17702)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 17.87679  (9.76851)
     | > current_lr: 0.00011 
     | > step_time: 0.63860  (0.67195)
     | > loader_time: 0.38840  (0.40787)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00500)
     | > avg_loss:[92m 0.24840 [0m(-0.11390)
     | > avg_log_mle:[91m -0.43869 [0m(+0.00138)
     | > avg_loss_dur:[92m 0.68708 [0m(-0.11528)


[4m[1m > EPOCH: 434/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:28:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 7825[0m
     | > loss: -0.21769  (-0.29132)
     | > log_mle: -0.47407  (-0.49456)
     | > loss_dur: 0.25639  (0.20324)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 20.95488  (17.80573)
     | > current_lr: 0.00011 
     | > step_time: 0.78470  (0.71896)
     | > loader_time: 0.47040  (0.44918)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00300)
     | > avg_loss:[91m 0.33537 [0m(+0.08698)
     | > avg_log_mle:[92m -0.45772 [0m(-0.01904)
     | > avg_loss_dur:[91m 0.79310 [0m(+0.10601)


[4m[1m > EPOCH: 435/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:29:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00200)
     | > avg_loss:[92m 0.28910 [0m(-0.04627)
     | > avg_log_mle:[92m -0.46255 [0m(-0.00483)
     | > avg_loss_dur:[92m 0.75165 [0m(-0.04145)


[4m[1m > EPOCH: 436/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:29:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 7850[0m
     | > loss: -0.39640  (-0.40717)
     | > log_mle: -0.53386  (-0.53758)
     | > loss_dur: 0.13746  (0.13041)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.74021  (9.81563)
     | > current_lr: 0.00011 
     | > step_time: 0.56550  (0.60955)
     | > loader_time: 0.36730  (0.37584)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00400)
     | > avg_loss:[91m 0.30477 [0m(+0.01567)
     | > avg_log_mle:[91m -0.46025 [0m(+0.00230)
     | > avg_loss_dur:[91m 0.76501 [0m(+0.01337)


[4m[1m > EPOCH: 437/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:30:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 7875[0m
     | > loss: -0.30111  (-0.33849)
     | > log_mle: -0.50628  (-0.51607)
     | > loss_dur: 0.20517  (0.17758)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 18.07783  (14.60309)
     | > current_lr: 0.00011 
     | > step_time: 0.86980  (0.68941)
     | > loader_time: 0.61360  (0.43439)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.30116 [0m(-0.00361)
     | > avg_log_mle:[91m -0.45571 [0m(+0.00454)
     | > avg_loss_dur:[92m 0.75687 [0m(-0.00815)


[4m[1m > EPOCH: 438/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:30:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 7900[0m
     | > loss: -0.23769  (-0.29903)
     | > log_mle: -0.46772  (-0.49584)
     | > loss_dur: 0.23003  (0.19681)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.81688  (14.82594)
     | > current_lr: 0.00011 
     | > step_time: 0.95290  (0.76476)
     | > loader_time: 0.62550  (0.49188)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00400)
     | > avg_loss:[91m 0.31762 [0m(+0.01646)
     | > avg_log_mle:[91m -0.45424 [0m(+0.00147)
     | > avg_loss_dur:[91m 0.77186 [0m(+0.01499)


[4m[1m > EPOCH: 439/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:31:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[92m 0.31648 [0m(-0.00115)
     | > avg_log_mle:[92m -0.45604 [0m(-0.00180)
     | > avg_loss_dur:[91m 0.77251 [0m(+0.00066)


[4m[1m > EPOCH: 440/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:31:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 7925[0m
     | > loss: -0.27086  (-0.34609)
     | > log_mle: -0.49061  (-0.51229)
     | > loss_dur: 0.21975  (0.16620)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.31286  (9.05103)
     | > current_lr: 0.00011 
     | > step_time: 0.74670  (0.67521)
     | > loader_time: 0.44740  (0.40517)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00300)
     | > avg_loss:[91m 0.38646 [0m(+0.06998)
     | > avg_log_mle:[91m -0.43892 [0m(+0.01712)
     | > avg_loss_dur:[91m 0.82538 [0m(+0.05286)


[4m[1m > EPOCH: 441/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:32:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 7950[0m
     | > loss: -0.26551  (-0.31293)
     | > log_mle: -0.48974  (-0.50124)
     | > loss_dur: 0.22423  (0.18831)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.46028  (17.81054)
     | > current_lr: 0.00011 
     | > step_time: 0.91880  (0.71473)
     | > loader_time: 0.62360  (0.45024)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00000)
     | > avg_loss:[92m 0.31997 [0m(-0.06649)
     | > avg_log_mle:[92m -0.45292 [0m(-0.01400)
     | > avg_loss_dur:[92m 0.77289 [0m(-0.05249)


[4m[1m > EPOCH: 442/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:32:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00200)
     | > avg_loss:[91m 0.34987 [0m(+0.02990)
     | > avg_log_mle:[92m -0.46321 [0m(-0.01029)
     | > avg_loss_dur:[91m 0.81308 [0m(+0.04019)


[4m[1m > EPOCH: 443/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:33:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 7975[0m
     | > loss: -0.42745  (-0.42745)
     | > log_mle: -0.54329  (-0.54329)
     | > loss_dur: 0.11584  (0.11584)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.96865  (10.96865)
     | > current_lr: 0.00011 
     | > step_time: 0.65060  (0.65059)
     | > loader_time: 0.38530  (0.38535)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00801)
     | > avg_loss:[92m 0.29806 [0m(-0.05181)
     | > avg_log_mle:[91m -0.45310 [0m(+0.01011)
     | > avg_loss_dur:[92m 0.75116 [0m(-0.06192)


[4m[1m > EPOCH: 444/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:33:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 8000[0m
     | > loss: -0.30011  (-0.34234)
     | > log_mle: -0.51087  (-0.51430)
     | > loss_dur: 0.21075  (0.17195)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 15.24535  (15.93307)
     | > current_lr: 0.00011 
     | > step_time: 0.67960  (0.66598)
     | > loader_time: 0.39640  (0.40324)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00500)
     | > avg_loss:[91m 0.29894 [0m(+0.00088)
     | > avg_log_mle:[91m -0.45264 [0m(+0.00047)
     | > avg_loss_dur:[91m 0.75158 [0m(+0.00042)


[4m[1m > EPOCH: 445/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:34:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 8025[0m
     | > loss: -0.27899  (-0.32085)
     | > log_mle: -0.48778  (-0.50734)
     | > loss_dur: 0.20879  (0.18649)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 16.64846  (13.02239)
     | > current_lr: 0.00011 
     | > step_time: 0.87380  (0.75269)
     | > loader_time: 0.51450  (0.47163)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[91m 0.32459 [0m(+0.02565)
     | > avg_log_mle:[92m -0.46048 [0m(-0.00784)
     | > avg_loss_dur:[91m 0.78506 [0m(+0.03349)


[4m[1m > EPOCH: 446/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:34:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[92m 0.30409 [0m(-0.02049)
     | > avg_log_mle:[92m -0.46118 [0m(-0.00070)
     | > avg_loss_dur:[92m 0.76527 [0m(-0.01979)


[4m[1m > EPOCH: 447/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:35:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 8050[0m
     | > loss: -0.36499  (-0.39795)
     | > log_mle: -0.52417  (-0.53729)
     | > loss_dur: 0.15919  (0.13934)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.89447  (7.76490)
     | > current_lr: 0.00011 
     | > step_time: 0.73770  (0.65910)
     | > loader_time: 0.49540  (0.41062)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00100)
     | > avg_loss:[92m 0.28970 [0m(-0.01439)
     | > avg_log_mle:[91m -0.42932 [0m(+0.03186)
     | > avg_loss_dur:[92m 0.71902 [0m(-0.04625)


[4m[1m > EPOCH: 448/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:36:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 8075[0m
     | > loss: -0.27724  (-0.29072)
     | > log_mle: -0.49067  (-0.49058)
     | > loss_dur: 0.21343  (0.19986)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.09423  (11.50724)
     | > current_lr: 0.00011 
     | > step_time: 0.73570  (0.69754)
     | > loader_time: 0.45440  (0.43967)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[91m 0.30545 [0m(+0.01575)
     | > avg_log_mle:[92m -0.44604 [0m(-0.01672)
     | > avg_loss_dur:[91m 0.75150 [0m(+0.03247)


[4m[1m > EPOCH: 449/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:36:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[91m 0.40811 [0m(+0.10266)
     | > avg_log_mle:[91m -0.43047 [0m(+0.01558)
     | > avg_loss_dur:[91m 0.83858 [0m(+0.08708)


[4m[1m > EPOCH: 450/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:37:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 8100[0m
     | > loss: -0.34258  (-0.34258)
     | > log_mle: -0.51211  (-0.51211)
     | > loss_dur: 0.16953  (0.16953)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.29033  (13.29033)
     | > current_lr: 0.00011 
     | > step_time: 0.50050  (0.50046)
     | > loader_time: 0.26420  (0.26423)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00000)
     | > avg_loss:[92m 0.33892 [0m(-0.06920)
     | > avg_log_mle:[91m -0.42061 [0m(+0.00985)
     | > avg_loss_dur:[92m 0.75953 [0m(-0.07905)


[4m[1m > EPOCH: 451/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:37:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 8125[0m
     | > loss: -0.25834  (-0.30305)
     | > log_mle: -0.49378  (-0.49702)
     | > loss_dur: 0.23544  (0.19397)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.85715  (7.98972)
     | > current_lr: 0.00011 
     | > step_time: 0.64160  (0.66718)
     | > loader_time: 0.41440  (0.41423)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[92m 0.32966 [0m(-0.00926)
     | > avg_log_mle:[92m -0.44992 [0m(-0.02930)
     | > avg_loss_dur:[91m 0.77957 [0m(+0.02004)


[4m[1m > EPOCH: 452/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:38:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 8150[0m
     | > loss: -0.25164  (-0.30422)
     | > log_mle: -0.47928  (-0.50511)
     | > loss_dur: 0.22764  (0.20089)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.50403  (14.52322)
     | > current_lr: 0.00011 
     | > step_time: 1.02190  (0.74003)
     | > loader_time: 0.58050  (0.47050)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00801)
     | > avg_loss:[92m 0.30857 [0m(-0.02109)
     | > avg_log_mle:[92m -0.46612 [0m(-0.01620)
     | > avg_loss_dur:[92m 0.77469 [0m(-0.00489)


[4m[1m > EPOCH: 453/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:38:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01101)
     | > avg_loss:[92m 0.29108 [0m(-0.01749)
     | > avg_log_mle:[91m -0.44860 [0m(+0.01752)
     | > avg_loss_dur:[92m 0.73968 [0m(-0.03501)


[4m[1m > EPOCH: 454/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:39:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 8175[0m
     | > loss: -0.39510  (-0.40530)
     | > log_mle: -0.53554  (-0.53754)
     | > loss_dur: 0.14043  (0.13224)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.33495  (7.54477)
     | > current_lr: 0.00011 
     | > step_time: 0.68660  (0.63158)
     | > loader_time: 0.47640  (0.40670)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00601)
     | > avg_loss:[91m 0.33769 [0m(+0.04662)
     | > avg_log_mle:[91m -0.44784 [0m(+0.00076)
     | > avg_loss_dur:[91m 0.78553 [0m(+0.04585)


[4m[1m > EPOCH: 455/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:39:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 8200[0m
     | > loss: -0.30474  (-0.33582)
     | > log_mle: -0.48985  (-0.51355)
     | > loss_dur: 0.18512  (0.17772)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.28261  (13.40027)
     | > current_lr: 0.00011 
     | > step_time: 0.70760  (0.69273)
     | > loader_time: 0.44940  (0.43309)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00501)
     | > avg_loss:[92m 0.33456 [0m(-0.00313)
     | > avg_log_mle:[92m -0.46153 [0m(-0.01370)
     | > avg_loss_dur:[91m 0.79609 [0m(+0.01056)


[4m[1m > EPOCH: 456/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:40:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 8225[0m
     | > loss: -0.25926  (-0.31866)
     | > log_mle: -0.48246  (-0.50652)
     | > loss_dur: 0.22320  (0.18786)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 35.24319  (12.16968)
     | > current_lr: 0.00011 
     | > step_time: 0.84880  (0.77069)
     | > loader_time: 0.45640  (0.47678)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00400)
     | > avg_loss:[92m 0.29830 [0m(-0.03626)
     | > avg_log_mle:[91m -0.44386 [0m(+0.01767)
     | > avg_loss_dur:[92m 0.74216 [0m(-0.05393)


[4m[1m > EPOCH: 457/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:40:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01101)
     | > avg_loss:[91m 0.38332 [0m(+0.08502)
     | > avg_log_mle:[92m -0.44988 [0m(-0.00602)
     | > avg_loss_dur:[91m 0.83321 [0m(+0.09104)


[4m[1m > EPOCH: 458/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:41:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 8250[0m
     | > loss: -0.29918  (-0.36505)
     | > log_mle: -0.49174  (-0.52071)
     | > loss_dur: 0.19256  (0.15567)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.85287  (15.59434)
     | > current_lr: 0.00011 
     | > step_time: 0.63920  (0.66989)
     | > loader_time: 0.44520  (0.42768)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00701)
     | > avg_loss:[92m 0.31280 [0m(-0.07052)
     | > avg_log_mle:[92m -0.45431 [0m(-0.00443)
     | > avg_loss_dur:[92m 0.76712 [0m(-0.06609)


[4m[1m > EPOCH: 459/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:41:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 8275[0m
     | > loss: -0.24946  (-0.32457)
     | > log_mle: -0.48800  (-0.51122)
     | > loss_dur: 0.23854  (0.18665)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.18295  (9.07082)
     | > current_lr: 0.00011 
     | > step_time: 0.78370  (0.71919)
     | > loader_time: 0.49650  (0.46250)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00801)
     | > avg_loss:[91m 0.32793 [0m(+0.01513)
     | > avg_log_mle:[92m -0.45617 [0m(-0.00185)
     | > avg_loss_dur:[91m 0.78410 [0m(+0.01698)


[4m[1m > EPOCH: 460/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:42:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00701)
     | > avg_loss:[92m 0.28688 [0m(-0.04105)
     | > avg_log_mle:[92m -0.46360 [0m(-0.00744)
     | > avg_loss_dur:[92m 0.75048 [0m(-0.03361)


[4m[1m > EPOCH: 461/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:42:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 8300[0m
     | > loss: -0.40117  (-0.41055)
     | > log_mle: -0.53731  (-0.54250)
     | > loss_dur: 0.13614  (0.13195)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.81869  (14.36894)
     | > current_lr: 0.00012 
     | > step_time: 0.56050  (0.60605)
     | > loader_time: 0.34730  (0.34631)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00801)
     | > avg_loss:[91m 0.30376 [0m(+0.01687)
     | > avg_log_mle:[91m -0.46258 [0m(+0.00102)
     | > avg_loss_dur:[91m 0.76634 [0m(+0.01585)


[4m[1m > EPOCH: 462/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:43:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 8325[0m
     | > loss: -0.33373  (-0.36451)
     | > log_mle: -0.52257  (-0.52982)
     | > loss_dur: 0.18885  (0.16532)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.30777  (12.58621)
     | > current_lr: 0.00012 
     | > step_time: 0.88680  (0.69675)
     | > loader_time: 0.60950  (0.44818)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01001)
     | > avg_loss:[92m 0.29694 [0m(-0.00681)
     | > avg_log_mle:[92m -0.46314 [0m(-0.00055)
     | > avg_loss_dur:[92m 0.76008 [0m(-0.00626)


[4m[1m > EPOCH: 463/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:43:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 8350[0m
     | > loss: -0.28661  (-0.33137)
     | > log_mle: -0.48846  (-0.51362)
     | > loss_dur: 0.20185  (0.18225)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.25255  (14.38006)
     | > current_lr: 0.00012 
     | > step_time: 0.95090  (0.76276)
     | > loader_time: 0.57250  (0.46842)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01201)
     | > avg_loss:[91m 0.35138 [0m(+0.05444)
     | > avg_log_mle:[91m -0.46012 [0m(+0.00302)
     | > avg_loss_dur:[91m 0.81150 [0m(+0.05142)


[4m[1m > EPOCH: 464/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:44:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08508 [0m(+0.02302)
     | > avg_loss:[92m 0.29009 [0m(-0.06130)
     | > avg_log_mle:[91m -0.45481 [0m(+0.00530)
     | > avg_loss_dur:[92m 0.74490 [0m(-0.06660)


[4m[1m > EPOCH: 465/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:44:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 8375[0m
     | > loss: -0.33828  (-0.38511)
     | > log_mle: -0.51628  (-0.53409)
     | > loss_dur: 0.17800  (0.14898)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.85706  (6.55115)
     | > current_lr: 0.00012 
     | > step_time: 0.73770  (0.67181)
     | > loader_time: 0.50050  (0.45862)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.01201)
     | > avg_loss:[91m 0.33146 [0m(+0.04137)
     | > avg_log_mle:[92m -0.46021 [0m(-0.00540)
     | > avg_loss_dur:[91m 0.79167 [0m(+0.04677)


[4m[1m > EPOCH: 466/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:45:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 8400[0m
     | > loss: -0.32393  (-0.35217)
     | > log_mle: -0.51223  (-0.52298)
     | > loss_dur: 0.18830  (0.17081)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.00215  (13.88776)
     | > current_lr: 0.00012 
     | > step_time: 0.91080  (0.71665)
     | > loader_time: 0.64860  (0.46584)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[92m 0.28872 [0m(-0.04274)
     | > avg_log_mle:[91m -0.44643 [0m(+0.01378)
     | > avg_loss_dur:[92m 0.73515 [0m(-0.05652)


[4m[1m > EPOCH: 467/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:46:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[91m 0.33843 [0m(+0.04971)
     | > avg_log_mle:[92m -0.45181 [0m(-0.00538)
     | > avg_loss_dur:[91m 0.79024 [0m(+0.05508)


[4m[1m > EPOCH: 468/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:46:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 8425[0m
     | > loss: -0.42624  (-0.42624)
     | > log_mle: -0.55018  (-0.55018)
     | > loss_dur: 0.12395  (0.12395)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.03720  (9.03720)
     | > current_lr: 0.00012 
     | > step_time: 0.65060  (0.65059)
     | > loader_time: 0.36330  (0.36333)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00100)
     | > avg_loss:[91m 0.34314 [0m(+0.00472)
     | > avg_log_mle:[92m -0.46509 [0m(-0.01328)
     | > avg_loss_dur:[91m 0.80824 [0m(+0.01800)


[4m[1m > EPOCH: 469/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:47:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 8450[0m
     | > loss: -0.33908  (-0.38055)
     | > log_mle: -0.52909  (-0.53533)
     | > loss_dur: 0.19001  (0.15478)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.57931  (15.50916)
     | > current_lr: 0.00012 
     | > step_time: 0.67660  (0.66973)
     | > loader_time: 0.41240  (0.41212)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00400)
     | > avg_loss:[92m 0.34214 [0m(-0.00101)
     | > avg_log_mle:[91m -0.46112 [0m(+0.00397)
     | > avg_loss_dur:[92m 0.80326 [0m(-0.00498)


[4m[1m > EPOCH: 470/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:47:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 8475[0m
     | > loss: -0.28539  (-0.35170)
     | > log_mle: -0.49738  (-0.52293)
     | > loss_dur: 0.21199  (0.17123)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.69286  (15.67545)
     | > current_lr: 0.00012 
     | > step_time: 0.87280  (0.74902)
     | > loader_time: 0.55450  (0.48390)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00100)
     | > avg_loss:[92m 0.30462 [0m(-0.03752)
     | > avg_log_mle:[92m -0.46515 [0m(-0.00403)
     | > avg_loss_dur:[92m 0.76977 [0m(-0.03349)


[4m[1m > EPOCH: 471/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:48:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01201)
     | > avg_loss:[91m 0.32592 [0m(+0.02130)
     | > avg_log_mle:[91m -0.45518 [0m(+0.00997)
     | > avg_loss_dur:[91m 0.78110 [0m(+0.01133)


[4m[1m > EPOCH: 472/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:48:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 8500[0m
     | > loss: -0.36259  (-0.40418)
     | > log_mle: -0.52614  (-0.54030)
     | > loss_dur: 0.16356  (0.13612)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.00268  (10.49752)
     | > current_lr: 0.00012 
     | > step_time: 0.73070  (0.65635)
     | > loader_time: 0.51950  (0.40612)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00400)
     | > avg_loss:[92m 0.29835 [0m(-0.02757)
     | > avg_log_mle:[91m -0.44846 [0m(+0.00673)
     | > avg_loss_dur:[92m 0.74680 [0m(-0.03430)


[4m[1m > EPOCH: 473/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:49:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 8525[0m
     | > loss: -0.34165  (-0.35525)
     | > log_mle: -0.51500  (-0.52180)
     | > loss_dur: 0.17335  (0.16654)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.43488  (17.86962)
     | > current_lr: 0.00012 
     | > step_time: 0.74670  (0.69955)
     | > loader_time: 0.46440  (0.43021)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00300)
     | > avg_loss:[91m 0.31967 [0m(+0.02132)
     | > avg_log_mle:[92m -0.45572 [0m(-0.00726)
     | > avg_loss_dur:[91m 0.77539 [0m(+0.02859)


[4m[1m > EPOCH: 474/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:49:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.00701)
     | > avg_loss:[91m 0.33347 [0m(+0.01380)
     | > avg_log_mle:[92m -0.46179 [0m(-0.00607)
     | > avg_loss_dur:[91m 0.79526 [0m(+0.01987)


[4m[1m > EPOCH: 475/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:50:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 8550[0m
     | > loss: -0.44816  (-0.44816)
     | > log_mle: -0.56301  (-0.56301)
     | > loss_dur: 0.11484  (0.11484)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.73164  (25.73164)
     | > current_lr: 0.00012 
     | > step_time: 0.61660  (0.61656)
     | > loader_time: 0.28230  (0.28226)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00601)
     | > avg_loss:[92m 0.29912 [0m(-0.03434)
     | > avg_log_mle:[91m -0.45427 [0m(+0.00752)
     | > avg_loss_dur:[92m 0.75339 [0m(-0.04186)


[4m[1m > EPOCH: 476/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:50:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 8575[0m
     | > loss: -0.28871  (-0.36686)
     | > log_mle: -0.50055  (-0.52712)
     | > loss_dur: 0.21184  (0.16026)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 27.15804  (14.86262)
     | > current_lr: 0.00012 
     | > step_time: 0.64960  (0.66246)
     | > loader_time: 0.43840  (0.41566)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.06706 [0m(+0.00000)
     | > avg_loss:[91m 0.35815 [0m(+0.05903)
     | > avg_log_mle:[91m -0.44667 [0m(+0.00760)
     | > avg_loss_dur:[91m 0.80483 [0m(+0.05143)


[4m[1m > EPOCH: 477/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:51:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 8600[0m
     | > loss: -0.28958  (-0.32228)
     | > log_mle: -0.48822  (-0.51005)
     | > loss_dur: 0.19863  (0.18777)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.34283  (16.23135)
     | > current_lr: 0.00012 
     | > step_time: 1.02390  (0.74575)
     | > loader_time: 0.62160  (0.48322)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00501)
     | > avg_loss:[92m 0.32763 [0m(-0.03052)
     | > avg_log_mle:[92m -0.46129 [0m(-0.01462)
     | > avg_loss_dur:[92m 0.78892 [0m(-0.01591)


[4m[1m > EPOCH: 478/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:51:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.00701)
     | > avg_loss:[92m 0.27663 [0m(-0.05100)
     | > avg_log_mle:[91m -0.46113 [0m(+0.00016)
     | > avg_loss_dur:[92m 0.73776 [0m(-0.05116)


[4m[1m > EPOCH: 479/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:52:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 8625[0m
     | > loss: -0.43112  (-0.43212)
     | > log_mle: -0.55766  (-0.55610)
     | > loss_dur: 0.12654  (0.12398)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.40373  (13.47946)
     | > current_lr: 0.00012 
     | > step_time: 0.68460  (0.63491)
     | > loader_time: 0.39940  (0.37467)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00501)
     | > avg_loss:[91m 0.31453 [0m(+0.03790)
     | > avg_log_mle:[91m -0.45600 [0m(+0.00512)
     | > avg_loss_dur:[91m 0.77054 [0m(+0.03278)


[4m[1m > EPOCH: 480/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:52:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 8650[0m
     | > loss: -0.33859  (-0.37457)
     | > log_mle: -0.50302  (-0.53050)
     | > loss_dur: 0.16442  (0.15593)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.92897  (8.52446)
     | > current_lr: 0.00012 
     | > step_time: 0.69860  (0.69133)
     | > loader_time: 0.47640  (0.43309)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08207 [0m(+0.00801)
     | > avg_loss:[92m 0.31340 [0m(-0.00113)
     | > avg_log_mle:[91m -0.44172 [0m(+0.01428)
     | > avg_loss_dur:[92m 0.75512 [0m(-0.01541)


[4m[1m > EPOCH: 481/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:53:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 8675[0m
     | > loss: -0.29905  (-0.33876)
     | > log_mle: -0.49749  (-0.51156)
     | > loss_dur: 0.19844  (0.17280)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.60787  (16.05185)
     | > current_lr: 0.00012 
     | > step_time: 0.84580  (0.76891)
     | > loader_time: 0.43540  (0.46748)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00801)
     | > avg_loss:[91m 0.33718 [0m(+0.02378)
     | > avg_log_mle:[92m -0.44642 [0m(-0.00470)
     | > avg_loss_dur:[91m 0.78361 [0m(+0.02848)


[4m[1m > EPOCH: 482/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:53:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00500)
     | > avg_loss:[92m 0.32843 [0m(-0.00875)
     | > avg_log_mle:[92m -0.45442 [0m(-0.00800)
     | > avg_loss_dur:[92m 0.78285 [0m(-0.00075)


[4m[1m > EPOCH: 483/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:54:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 8700[0m
     | > loss: -0.31803  (-0.38647)
     | > log_mle: -0.50482  (-0.53526)
     | > loss_dur: 0.18679  (0.14879)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.18064  (13.23356)
     | > current_lr: 0.00012 
     | > step_time: 0.63660  (0.66844)
     | > loader_time: 0.39540  (0.41321)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[91m 0.35412 [0m(+0.02569)
     | > avg_log_mle:[92m -0.45699 [0m(-0.00257)
     | > avg_loss_dur:[91m 0.81111 [0m(+0.02826)


[4m[1m > EPOCH: 484/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:54:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 8725[0m
     | > loss: -0.29072  (-0.36193)
     | > log_mle: -0.50107  (-0.52740)
     | > loss_dur: 0.21035  (0.16547)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.83283  (15.03406)
     | > current_lr: 0.00012 
     | > step_time: 0.78470  (0.72096)
     | > loader_time: 0.53050  (0.46250)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00000)
     | > avg_loss:[92m 0.31823 [0m(-0.03589)
     | > avg_log_mle:[91m -0.45065 [0m(+0.00635)
     | > avg_loss_dur:[92m 0.76888 [0m(-0.04224)


[4m[1m > EPOCH: 485/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:55:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[91m 0.33621 [0m(+0.01798)
     | > avg_log_mle:[92m -0.46281 [0m(-0.01216)
     | > avg_loss_dur:[91m 0.79902 [0m(+0.03014)


[4m[1m > EPOCH: 486/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:56:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 8750[0m
     | > loss: -0.42114  (-0.43765)
     | > log_mle: -0.54994  (-0.55849)
     | > loss_dur: 0.12880  (0.12084)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.69057  (7.73030)
     | > current_lr: 0.00012 
     | > step_time: 0.56650  (0.61006)
     | > loader_time: 0.33530  (0.35032)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00300)
     | > avg_loss:[92m 0.29444 [0m(-0.04177)
     | > avg_log_mle:[91m -0.45873 [0m(+0.00407)
     | > avg_loss_dur:[92m 0.75318 [0m(-0.04584)


[4m[1m > EPOCH: 487/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:56:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 8775[0m
     | > loss: -0.35895  (-0.38159)
     | > log_mle: -0.53261  (-0.53709)
     | > loss_dur: 0.17367  (0.15550)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.69223  (11.08056)
     | > current_lr: 0.00012 
     | > step_time: 0.86980  (0.68885)
     | > loader_time: 0.59550  (0.42739)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[91m 0.32903 [0m(+0.03459)
     | > avg_log_mle:[92m -0.45877 [0m(-0.00003)
     | > avg_loss_dur:[91m 0.78780 [0m(+0.03462)


[4m[1m > EPOCH: 488/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:57:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 8800[0m
     | > loss: -0.32128  (-0.35972)
     | > log_mle: -0.50309  (-0.52599)
     | > loss_dur: 0.18180  (0.16627)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.39044  (18.28670)
     | > current_lr: 0.00012 
     | > step_time: 0.95490  (0.76545)
     | > loader_time: 0.58150  (0.48269)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00200)
     | > avg_loss:[92m 0.30294 [0m(-0.02609)
     | > avg_log_mle:[92m -0.46759 [0m(-0.00882)
     | > avg_loss_dur:[92m 0.77054 [0m(-0.01726)


[4m[1m > EPOCH: 489/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:57:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00701)
     | > avg_loss:[92m 0.29947 [0m(-0.00347)
     | > avg_log_mle:[91m -0.46571 [0m(+0.00189)
     | > avg_loss_dur:[92m 0.76518 [0m(-0.00536)


[4m[1m > EPOCH: 490/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:58:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 8825[0m
     | > loss: -0.36926  (-0.41648)
     | > log_mle: -0.53280  (-0.55248)
     | > loss_dur: 0.16355  (0.13600)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.87797  (8.57343)
     | > current_lr: 0.00012 
     | > step_time: 0.73970  (0.67301)
     | > loader_time: 0.44540  (0.40717)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01001)
     | > avg_loss:[92m 0.27384 [0m(-0.02563)
     | > avg_log_mle:[91m -0.44977 [0m(+0.01594)
     | > avg_loss_dur:[92m 0.72361 [0m(-0.04157)


[4m[1m > EPOCH: 491/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:58:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 8850[0m
     | > loss: -0.30656  (-0.35301)
     | > log_mle: -0.50062  (-0.51975)
     | > loss_dur: 0.19406  (0.16675)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.40646  (16.80437)
     | > current_lr: 0.00012 
     | > step_time: 0.91680  (0.71674)
     | > loader_time: 0.68560  (0.45466)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00100)
     | > avg_loss:[91m 0.33365 [0m(+0.05981)
     | > avg_log_mle:[92m -0.45351 [0m(-0.00374)
     | > avg_loss_dur:[91m 0.78716 [0m(+0.06355)


[4m[1m > EPOCH: 492/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:59:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00701)
     | > avg_loss:[92m 0.30947 [0m(-0.02419)
     | > avg_log_mle:[92m -0.46138 [0m(-0.00787)
     | > avg_loss_dur:[92m 0.77084 [0m(-0.01632)


[4m[1m > EPOCH: 493/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 08:59:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 8875[0m
     | > loss: -0.43907  (-0.43907)
     | > log_mle: -0.55778  (-0.55778)
     | > loss_dur: 0.11871  (0.11871)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.10716  (7.10716)
     | > current_lr: 0.00012 
     | > step_time: 0.65160  (0.65159)
     | > loader_time: 0.40840  (0.40837)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[92m 0.26883 [0m(-0.04063)
     | > avg_log_mle:[91m -0.46089 [0m(+0.00049)
     | > avg_loss_dur:[92m 0.72972 [0m(-0.04112)


[4m[1m > EPOCH: 494/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:00:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 8900[0m
     | > loss: -0.32645  (-0.37246)
     | > log_mle: -0.51536  (-0.53140)
     | > loss_dur: 0.18891  (0.15895)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.06289  (17.11392)
     | > current_lr: 0.00012 
     | > step_time: 0.67760  (0.66704)
     | > loader_time: 0.41640  (0.40663)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.33205 [0m(+0.06322)
     | > avg_log_mle:[92m -0.46397 [0m(-0.00308)
     | > avg_loss_dur:[91m 0.79602 [0m(+0.06630)


[4m[1m > EPOCH: 495/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:00:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 8925[0m
     | > loss: -0.28786  (-0.34077)
     | > log_mle: -0.49783  (-0.52047)
     | > loss_dur: 0.20998  (0.17970)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.34996  (15.26179)
     | > current_lr: 0.00012 
     | > step_time: 0.87280  (0.75502)
     | > loader_time: 0.58950  (0.48410)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01001)
     | > avg_loss:[91m 0.37251 [0m(+0.04046)
     | > avg_log_mle:[91m -0.45330 [0m(+0.01066)
     | > avg_loss_dur:[91m 0.82581 [0m(+0.02979)


[4m[1m > EPOCH: 496/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:01:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01101)
     | > avg_loss:[92m 0.32979 [0m(-0.04272)
     | > avg_log_mle:[91m -0.44410 [0m(+0.00920)
     | > avg_loss_dur:[92m 0.77389 [0m(-0.05192)


[4m[1m > EPOCH: 497/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:01:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 8950[0m
     | > loss: -0.38517  (-0.42748)
     | > log_mle: -0.53704  (-0.55722)
     | > loss_dur: 0.15187  (0.12974)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.18809  (10.21119)
     | > current_lr: 0.00012 
     | > step_time: 0.73670  (0.66060)
     | > loader_time: 0.48540  (0.40512)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00200)
     | > avg_loss:[92m 0.32200 [0m(-0.00779)
     | > avg_log_mle:[92m -0.44924 [0m(-0.00514)
     | > avg_loss_dur:[92m 0.77124 [0m(-0.00265)


[4m[1m > EPOCH: 498/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:02:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 8975[0m
     | > loss: -0.36597  (-0.38050)
     | > log_mle: -0.52609  (-0.53735)
     | > loss_dur: 0.16012  (0.15685)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 31.32167  (14.78011)
     | > current_lr: 0.00012 
     | > step_time: 0.73970  (0.69581)
     | > loader_time: 0.44640  (0.42602)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00100)
     | > avg_loss:[91m 0.38476 [0m(+0.06276)
     | > avg_log_mle:[91m -0.44796 [0m(+0.00128)
     | > avg_loss_dur:[91m 0.83272 [0m(+0.06148)


[4m[1m > EPOCH: 499/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:02:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[92m 0.29509 [0m(-0.08966)
     | > avg_log_mle:[92m -0.45536 [0m(-0.00740)
     | > avg_loss_dur:[92m 0.75045 [0m(-0.08226)


[4m[1m > EPOCH: 500/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:03:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 9000[0m
     | > loss: -0.45424  (-0.45424)
     | > log_mle: -0.57005  (-0.57005)
     | > loss_dur: 0.11581  (0.11581)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.54515  (9.54515)
     | > current_lr: 0.00013 
     | > step_time: 0.50350  (0.50346)
     | > loader_time: 0.27630  (0.27625)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.35635 [0m(+0.06126)
     | > avg_log_mle:[92m -0.46369 [0m(-0.00833)
     | > avg_loss_dur:[91m 0.82004 [0m(+0.06959)


[4m[1m > EPOCH: 501/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:03:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 9025[0m
     | > loss: -0.35443  (-0.40603)
     | > log_mle: -0.53246  (-0.55177)
     | > loss_dur: 0.17804  (0.14574)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.23613  (11.95303)
     | > current_lr: 0.00013 
     | > step_time: 0.64960  (0.66732)
     | > loader_time: 0.39140  (0.40279)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00901)
     | > avg_loss:[92m 0.29087 [0m(-0.06548)
     | > avg_log_mle:[91m -0.46326 [0m(+0.00044)
     | > avg_loss_dur:[92m 0.75413 [0m(-0.06592)


[4m[1m > EPOCH: 502/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:04:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 9050[0m
     | > loss: -0.32425  (-0.36649)
     | > log_mle: -0.50560  (-0.53506)
     | > loss_dur: 0.18135  (0.16857)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.69768  (14.23787)
     | > current_lr: 0.00013 
     | > step_time: 1.02090  (0.74103)
     | > loader_time: 0.59350  (0.49795)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00601)
     | > avg_loss:[91m 0.32327 [0m(+0.03240)
     | > avg_log_mle:[91m -0.45685 [0m(+0.00640)
     | > avg_loss_dur:[91m 0.78012 [0m(+0.02600)


[4m[1m > EPOCH: 503/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:05:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00801)
     | > avg_loss:[91m 0.34195 [0m(+0.01868)
     | > avg_log_mle:[91m -0.45523 [0m(+0.00163)
     | > avg_loss_dur:[91m 0.79717 [0m(+0.01705)


[4m[1m > EPOCH: 504/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:05:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 9075[0m
     | > loss: -0.42531  (-0.44407)
     | > log_mle: -0.56143  (-0.56560)
     | > loss_dur: 0.13612  (0.12153)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.86888  (6.33314)
     | > current_lr: 0.00013 
     | > step_time: 0.68660  (0.63191)
     | > loader_time: 0.40140  (0.36600)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00801)
     | > avg_loss:[92m 0.30590 [0m(-0.03605)
     | > avg_log_mle:[92m -0.45718 [0m(-0.00196)
     | > avg_loss_dur:[92m 0.76308 [0m(-0.03409)


[4m[1m > EPOCH: 505/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:06:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 9100[0m
     | > loss: -0.35068  (-0.37679)
     | > log_mle: -0.51457  (-0.53799)
     | > loss_dur: 0.16389  (0.16120)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.35039  (13.79081)
     | > current_lr: 0.00013 
     | > step_time: 0.70360  (0.69483)
     | > loader_time: 0.46240  (0.44480)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[91m 0.33274 [0m(+0.02683)
     | > avg_log_mle:[92m -0.46302 [0m(-0.00584)
     | > avg_loss_dur:[91m 0.79576 [0m(+0.03268)


[4m[1m > EPOCH: 506/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:06:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 9125[0m
     | > loss: -0.33445  (-0.36005)
     | > log_mle: -0.50853  (-0.52910)
     | > loss_dur: 0.17407  (0.16905)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.93243  (14.43896)
     | > current_lr: 0.00013 
     | > step_time: 0.85580  (0.76894)
     | > loader_time: 0.42940  (0.47890)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00400)
     | > avg_loss:[92m 0.30495 [0m(-0.02779)
     | > avg_log_mle:[92m -0.46561 [0m(-0.00259)
     | > avg_loss_dur:[92m 0.77056 [0m(-0.02520)


[4m[1m > EPOCH: 507/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:07:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07207 [0m(+0.00000)
     | > avg_loss:[91m 0.33421 [0m(+0.02926)
     | > avg_log_mle:[91m -0.46014 [0m(+0.00547)
     | > avg_loss_dur:[91m 0.79435 [0m(+0.02379)


[4m[1m > EPOCH: 508/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:07:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 9150[0m
     | > loss: -0.34280  (-0.41763)
     | > log_mle: -0.51737  (-0.55550)
     | > loss_dur: 0.17457  (0.13787)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 37.54105  (15.13763)
     | > current_lr: 0.00013 
     | > step_time: 0.63860  (0.66844)
     | > loader_time: 0.42040  (0.42589)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.00701)
     | > avg_loss:[91m 0.34253 [0m(+0.00832)
     | > avg_log_mle:[92m -0.46448 [0m(-0.00434)
     | > avg_loss_dur:[91m 0.80701 [0m(+0.01266)


[4m[1m > EPOCH: 509/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:08:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 9175[0m
     | > loss: -0.28595  (-0.37078)
     | > log_mle: -0.50078  (-0.53557)
     | > loss_dur: 0.21482  (0.16479)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.89267  (16.90999)
     | > current_lr: 0.00013 
     | > step_time: 0.78770  (0.72081)
     | > loader_time: 0.50650  (0.44987)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00901)
     | > avg_loss:[92m 0.31425 [0m(-0.02828)
     | > avg_log_mle:[91m -0.45723 [0m(+0.00725)
     | > avg_loss_dur:[92m 0.77148 [0m(-0.03553)


[4m[1m > EPOCH: 510/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:08:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[91m 0.39411 [0m(+0.07986)
     | > avg_log_mle:[91m -0.43513 [0m(+0.02211)
     | > avg_loss_dur:[91m 0.82924 [0m(+0.05776)


[4m[1m > EPOCH: 511/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:09:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 9200[0m
     | > loss: -0.45748  (-0.45843)
     | > log_mle: -0.56759  (-0.56505)
     | > loss_dur: 0.11012  (0.10662)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.36257  (14.51664)
     | > current_lr: 0.00013 
     | > step_time: 0.56350  (0.61005)
     | > loader_time: 0.34430  (0.36884)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00000)
     | > avg_loss:[92m 0.31384 [0m(-0.08027)
     | > avg_log_mle:[92m -0.46061 [0m(-0.02548)
     | > avg_loss_dur:[92m 0.77445 [0m(-0.05479)


[4m[1m > EPOCH: 512/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:09:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 9225[0m
     | > loss: -0.35888  (-0.40121)
     | > log_mle: -0.53970  (-0.55143)
     | > loss_dur: 0.18082  (0.15022)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.12558  (16.48932)
     | > current_lr: 0.00013 
     | > step_time: 0.87580  (0.69352)
     | > loader_time: 0.60860  (0.44707)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[91m 0.34945 [0m(+0.03561)
     | > avg_log_mle:[91m -0.45842 [0m(+0.00219)
     | > avg_loss_dur:[91m 0.80788 [0m(+0.03343)


[4m[1m > EPOCH: 513/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:10:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 9250[0m
     | > loss: -0.32924  (-0.38259)
     | > log_mle: -0.50582  (-0.53996)
     | > loss_dur: 0.17658  (0.15737)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.61918  (13.22062)
     | > current_lr: 0.00013 
     | > step_time: 0.95790  (0.76213)
     | > loader_time: 0.61760  (0.51353)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00100)
     | > avg_loss:[92m 0.29218 [0m(-0.05728)
     | > avg_log_mle:[92m -0.46271 [0m(-0.00429)
     | > avg_loss_dur:[92m 0.75489 [0m(-0.05298)


[4m[1m > EPOCH: 514/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:10:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.00601)
     | > avg_loss:[92m 0.28892 [0m(-0.00326)
     | > avg_log_mle:[91m -0.45612 [0m(+0.00660)
     | > avg_loss_dur:[92m 0.74503 [0m(-0.00986)


[4m[1m > EPOCH: 515/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:11:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 9275[0m
     | > loss: -0.37916  (-0.44492)
     | > log_mle: -0.53746  (-0.56766)
     | > loss_dur: 0.15831  (0.12274)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.16725  (15.92748)
     | > current_lr: 0.00013 
     | > step_time: 0.74070  (0.67201)
     | > loader_time: 0.46740  (0.41738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.01001)
     | > avg_loss:[91m 0.33573 [0m(+0.04681)
     | > avg_log_mle:[92m -0.45746 [0m(-0.00134)
     | > avg_loss_dur:[91m 0.79319 [0m(+0.04815)


[4m[1m > EPOCH: 516/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:11:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 9300[0m
     | > loss: -0.32984  (-0.39197)
     | > log_mle: -0.51853  (-0.54377)
     | > loss_dur: 0.18870  (0.15180)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.04572  (13.63300)
     | > current_lr: 0.00013 
     | > step_time: 0.91480  (0.71507)
     | > loader_time: 0.62960  (0.45408)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00500)
     | > avg_loss:[91m 0.39988 [0m(+0.06415)
     | > avg_log_mle:[91m -0.44514 [0m(+0.01232)
     | > avg_loss_dur:[91m 0.84502 [0m(+0.05183)


[4m[1m > EPOCH: 517/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:12:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00400)
     | > avg_loss:[92m 0.32580 [0m(-0.07408)
     | > avg_log_mle:[91m -0.44208 [0m(+0.00306)
     | > avg_loss_dur:[92m 0.76788 [0m(-0.07714)


[4m[1m > EPOCH: 518/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:12:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 9325[0m
     | > loss: -0.46149  (-0.46149)
     | > log_mle: -0.57399  (-0.57399)
     | > loss_dur: 0.11250  (0.11250)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.89408  (10.89408)
     | > current_lr: 0.00013 
     | > step_time: 0.65060  (0.65059)
     | > loader_time: 0.37230  (0.37234)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00300)
     | > avg_loss:[92m 0.32013 [0m(-0.00567)
     | > avg_log_mle:[92m -0.45438 [0m(-0.01230)
     | > avg_loss_dur:[91m 0.77451 [0m(+0.00662)


[4m[1m > EPOCH: 519/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:13:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 9350[0m
     | > loss: -0.39410  (-0.41574)
     | > log_mle: -0.55372  (-0.55992)
     | > loss_dur: 0.15963  (0.14418)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.68940  (16.18508)
     | > current_lr: 0.00013 
     | > step_time: 0.68460  (0.67049)
     | > loader_time: 0.41840  (0.40787)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00200)
     | > avg_loss:[91m 0.33479 [0m(+0.01466)
     | > avg_log_mle:[92m -0.45855 [0m(-0.00417)
     | > avg_loss_dur:[91m 0.79334 [0m(+0.01883)


[4m[1m > EPOCH: 520/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:13:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 9375[0m
     | > loss: -0.32011  (-0.38539)
     | > log_mle: -0.51187  (-0.54293)
     | > loss_dur: 0.19176  (0.15754)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.99402  (15.29284)
     | > current_lr: 0.00013 
     | > step_time: 0.87580  (0.74915)
     | > loader_time: 0.54650  (0.48878)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00501)
     | > avg_loss:[91m 0.38879 [0m(+0.05400)
     | > avg_log_mle:[91m -0.43932 [0m(+0.01923)
     | > avg_loss_dur:[91m 0.82811 [0m(+0.03477)


[4m[1m > EPOCH: 521/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:14:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.00100)
     | > avg_loss:[91m 0.39566 [0m(+0.00687)
     | > avg_log_mle:[91m -0.43609 [0m(+0.00323)
     | > avg_loss_dur:[91m 0.83175 [0m(+0.00364)


[4m[1m > EPOCH: 522/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:14:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 9400[0m
     | > loss: -0.40834  (-0.44573)
     | > log_mle: -0.55094  (-0.56741)
     | > loss_dur: 0.14260  (0.12168)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.83443  (7.48789)
     | > current_lr: 0.00013 
     | > step_time: 0.72970  (0.65835)
     | > loader_time: 0.57750  (0.42864)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.00000)
     | > avg_loss:[92m 0.37339 [0m(-0.02227)
     | > avg_log_mle:[92m -0.45579 [0m(-0.01970)
     | > avg_loss_dur:[92m 0.82918 [0m(-0.00257)


[4m[1m > EPOCH: 523/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:15:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 9425[0m
     | > loss: -0.38096  (-0.40119)
     | > log_mle: -0.53680  (-0.55176)
     | > loss_dur: 0.15585  (0.15057)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.61905  (8.88204)
     | > current_lr: 0.00013 
     | > step_time: 0.75170  (0.69854)
     | > loader_time: 0.45540  (0.43285)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00300)
     | > avg_loss:[91m 0.38710 [0m(+0.01371)
     | > avg_log_mle:[92m -0.45633 [0m(-0.00055)
     | > avg_loss_dur:[91m 0.84343 [0m(+0.01425)


[4m[1m > EPOCH: 524/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:16:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.01201)
     | > avg_loss:[92m 0.32630 [0m(-0.06080)
     | > avg_log_mle:[91m -0.45093 [0m(+0.00541)
     | > avg_loss_dur:[92m 0.77723 [0m(-0.06620)


[4m[1m > EPOCH: 525/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:16:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 9450[0m
     | > loss: -0.46637  (-0.46637)
     | > log_mle: -0.57375  (-0.57375)
     | > loss_dur: 0.10737  (0.10737)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.71664  (22.71664)
     | > current_lr: 0.00013 
     | > step_time: 0.59750  (0.59754)
     | > loader_time: 0.27920  (0.27924)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.01201)
     | > avg_loss:[91m 0.33832 [0m(+0.01202)
     | > avg_log_mle:[92m -0.46427 [0m(-0.01335)
     | > avg_loss_dur:[91m 0.80259 [0m(+0.02537)


[4m[1m > EPOCH: 526/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:17:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 9475[0m
     | > loss: -0.38656  (-0.42566)
     | > log_mle: -0.54783  (-0.56024)
     | > loss_dur: 0.16127  (0.13458)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.27099  (17.47948)
     | > current_lr: 0.00013 
     | > step_time: 0.65260  (0.66732)
     | > loader_time: 0.42240  (0.46013)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07206 [0m(+0.00000)
     | > avg_loss:[91m 0.38782 [0m(+0.04950)
     | > avg_log_mle:[91m -0.45133 [0m(+0.01294)
     | > avg_loss_dur:[91m 0.83915 [0m(+0.03656)


[4m[1m > EPOCH: 527/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:17:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 9500[0m
     | > loss: -0.33925  (-0.38226)
     | > log_mle: -0.50858  (-0.53614)
     | > loss_dur: 0.16932  (0.15387)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.37500  (13.12813)
     | > current_lr: 0.00013 
     | > step_time: 1.02810  (0.74411)
     | > loader_time: 0.64560  (0.47064)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.39772 [0m(+0.00989)
     | > avg_log_mle:[91m -0.41857 [0m(+0.03276)
     | > avg_loss_dur:[92m 0.81628 [0m(-0.02287)


[4m[1m > EPOCH: 528/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:18:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[92m 0.38994 [0m(-0.00777)
     | > avg_log_mle:[92m -0.44588 [0m(-0.02731)
     | > avg_loss_dur:[91m 0.83582 [0m(+0.01954)


[4m[1m > EPOCH: 529/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:18:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 9525[0m
     | > loss: -0.46646  (-0.46044)
     | > log_mle: -0.57905  (-0.57174)
     | > loss_dur: 0.11259  (0.11130)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.99051  (9.67145)
     | > current_lr: 0.00013 
     | > step_time: 0.69260  (0.63825)
     | > loader_time: 0.42540  (0.39336)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00400)
     | > avg_loss:[92m 0.34647 [0m(-0.04347)
     | > avg_log_mle:[92m -0.46497 [0m(-0.01910)
     | > avg_loss_dur:[92m 0.81145 [0m(-0.02437)


[4m[1m > EPOCH: 530/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:19:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 9550[0m
     | > loss: -0.36231  (-0.39969)
     | > log_mle: -0.51720  (-0.54483)
     | > loss_dur: 0.15489  (0.14514)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.19969  (15.02944)
     | > current_lr: 0.00013 
     | > step_time: 0.70360  (0.69203)
     | > loader_time: 0.48740  (0.43249)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00801)
     | > avg_loss:[91m 0.35581 [0m(+0.00933)
     | > avg_log_mle:[91m -0.44691 [0m(+0.01806)
     | > avg_loss_dur:[92m 0.80272 [0m(-0.00873)


[4m[1m > EPOCH: 531/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:19:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 9575[0m
     | > loss: -0.32739  (-0.37767)
     | > log_mle: -0.50821  (-0.53604)
     | > loss_dur: 0.18082  (0.15838)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 51.49485  (19.24984)
     | > current_lr: 0.00013 
     | > step_time: 0.84380  (0.76788)
     | > loader_time: 0.40040  (0.47790)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01301)
     | > avg_loss:[91m 0.37989 [0m(+0.02409)
     | > avg_log_mle:[92m -0.44841 [0m(-0.00149)
     | > avg_loss_dur:[91m 0.82830 [0m(+0.02558)


[4m[1m > EPOCH: 532/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:20:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01201)
     | > avg_loss:[92m 0.36393 [0m(-0.01596)
     | > avg_log_mle:[92m -0.46270 [0m(-0.01429)
     | > avg_loss_dur:[92m 0.82663 [0m(-0.00167)


[4m[1m > EPOCH: 533/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:20:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 9600[0m
     | > loss: -0.36174  (-0.43629)
     | > log_mle: -0.52583  (-0.56754)
     | > loss_dur: 0.16409  (0.13125)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.37079  (11.28227)
     | > current_lr: 0.00013 
     | > step_time: 0.63560  (0.66544)
     | > loader_time: 0.41040  (0.41504)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[92m 0.33582 [0m(-0.02812)
     | > avg_log_mle:[91m -0.45356 [0m(+0.00913)
     | > avg_loss_dur:[92m 0.78938 [0m(-0.03725)


[4m[1m > EPOCH: 534/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:21:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 9625[0m
     | > loss: -0.29254  (-0.39045)
     | > log_mle: -0.50456  (-0.54549)
     | > loss_dur: 0.21202  (0.15504)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 48.56676  (16.82363)
     | > current_lr: 0.00013 
     | > step_time: 0.78670  (0.72166)
     | > loader_time: 0.53750  (0.45633)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08007 [0m(+0.01001)
     | > avg_loss:[92m 0.32088 [0m(-0.01494)
     | > avg_log_mle:[92m -0.45675 [0m(-0.00318)
     | > avg_loss_dur:[92m 0.77762 [0m(-0.01176)


[4m[1m > EPOCH: 535/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:21:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.01601)
     | > avg_loss:[91m 0.35161 [0m(+0.03073)
     | > avg_log_mle:[92m -0.46334 [0m(-0.00660)
     | > avg_loss_dur:[91m 0.81495 [0m(+0.03733)


[4m[1m > EPOCH: 536/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:22:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 9650[0m
     | > loss: -0.48938  (-0.49221)
     | > log_mle: -0.59250  (-0.59761)
     | > loss_dur: 0.10313  (0.10541)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.67224  (8.34413)
     | > current_lr: 0.00013 
     | > step_time: 0.55850  (0.60405)
     | > loader_time: 0.36530  (0.36733)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00701)
     | > avg_loss:[92m 0.33469 [0m(-0.01692)
     | > avg_log_mle:[91m -0.46018 [0m(+0.00316)
     | > avg_loss_dur:[92m 0.79487 [0m(-0.02008)


[4m[1m > EPOCH: 537/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:22:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 9675[0m
     | > loss: -0.37304  (-0.41293)
     | > log_mle: -0.54080  (-0.55802)
     | > loss_dur: 0.16777  (0.14509)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.94993  (16.38956)
     | > current_lr: 0.00013 
     | > step_time: 0.86780  (0.68863)
     | > loader_time: 0.56050  (0.41660)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00400)
     | > avg_loss:[91m 0.42674 [0m(+0.09205)
     | > avg_log_mle:[91m -0.44376 [0m(+0.01642)
     | > avg_loss_dur:[91m 0.87050 [0m(+0.07563)


[4m[1m > EPOCH: 538/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:23:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 9700[0m
     | > loss: -0.30587  (-0.37053)
     | > log_mle: -0.49065  (-0.53268)
     | > loss_dur: 0.18478  (0.16215)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.82516  (15.02502)
     | > current_lr: 0.00013 
     | > step_time: 0.95490  (0.76551)
     | > loader_time: 0.62450  (0.47693)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00701)
     | > avg_loss:[92m 0.33783 [0m(-0.08891)
     | > avg_log_mle:[92m -0.45132 [0m(-0.00755)
     | > avg_loss_dur:[92m 0.78915 [0m(-0.08135)


[4m[1m > EPOCH: 539/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:23:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00500)
     | > avg_loss:[92m 0.32032 [0m(-0.01751)
     | > avg_log_mle:[92m -0.45907 [0m(-0.00776)
     | > avg_loss_dur:[92m 0.77939 [0m(-0.00976)


[4m[1m > EPOCH: 540/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:24:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 9725[0m
     | > loss: -0.39537  (-0.44848)
     | > log_mle: -0.55748  (-0.57948)
     | > loss_dur: 0.16211  (0.13100)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.33423  (9.25325)
     | > current_lr: 0.00014 
     | > step_time: 0.74570  (0.67642)
     | > loader_time: 0.46940  (0.42078)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[91m 0.34363 [0m(+0.02331)
     | > avg_log_mle:[91m -0.44402 [0m(+0.01505)
     | > avg_loss_dur:[91m 0.78766 [0m(+0.00826)


[4m[1m > EPOCH: 541/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:24:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 9750[0m
     | > loss: -0.37072  (-0.41248)
     | > log_mle: -0.53556  (-0.55643)
     | > loss_dur: 0.16484  (0.14395)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.96032  (14.68407)
     | > current_lr: 0.00014 
     | > step_time: 0.90880  (0.71432)
     | > loader_time: 0.62860  (0.45232)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06705 [0m(-0.00702)
     | > avg_loss:[91m 0.41939 [0m(+0.07576)
     | > avg_log_mle:[92m -0.45338 [0m(-0.00936)
     | > avg_loss_dur:[91m 0.87277 [0m(+0.08512)


[4m[1m > EPOCH: 542/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:25:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00401)
     | > avg_loss:[92m 0.40480 [0m(-0.01459)
     | > avg_log_mle:[91m -0.44870 [0m(+0.00469)
     | > avg_loss_dur:[92m 0.85349 [0m(-0.01928)


[4m[1m > EPOCH: 543/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:26:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 9775[0m
     | > loss: -0.49127  (-0.49127)
     | > log_mle: -0.59209  (-0.59209)
     | > loss_dur: 0.10082  (0.10082)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.14572  (10.14572)
     | > current_lr: 0.00014 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.36730  (0.36733)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06204 [0m(-0.00902)
     | > avg_loss:[91m 0.41503 [0m(+0.01024)
     | > avg_log_mle:[92m -0.45780 [0m(-0.00911)
     | > avg_loss_dur:[91m 0.87284 [0m(+0.01934)


[4m[1m > EPOCH: 544/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:26:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 9800[0m
     | > loss: -0.41210  (-0.44068)
     | > log_mle: -0.56831  (-0.57504)
     | > loss_dur: 0.15621  (0.13436)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.04783  (13.77474)
     | > current_lr: 0.00014 
     | > step_time: 0.67760  (0.66536)
     | > loader_time: 0.44040  (0.40925)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00802)
     | > avg_loss:[92m 0.37778 [0m(-0.03726)
     | > avg_log_mle:[91m -0.45387 [0m(+0.00393)
     | > avg_loss_dur:[92m 0.83165 [0m(-0.04119)


[4m[1m > EPOCH: 545/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:27:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 9825[0m
     | > loss: -0.31017  (-0.39619)
     | > log_mle: -0.49966  (-0.54614)
     | > loss_dur: 0.18949  (0.14995)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.89206  (16.40115)
     | > current_lr: 0.00014 
     | > step_time: 0.87880  (0.75068)
     | > loader_time: 0.55350  (0.48331)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00601)
     | > avg_loss:[92m 0.35839 [0m(-0.01939)
     | > avg_log_mle:[91m -0.45371 [0m(+0.00016)
     | > avg_loss_dur:[92m 0.81210 [0m(-0.01955)


[4m[1m > EPOCH: 546/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:27:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01001)
     | > avg_loss:[91m 0.38432 [0m(+0.02593)
     | > avg_log_mle:[91m -0.45185 [0m(+0.00186)
     | > avg_loss_dur:[91m 0.83617 [0m(+0.02407)


[4m[1m > EPOCH: 547/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:28:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 9850[0m
     | > loss: -0.40182  (-0.46450)
     | > log_mle: -0.55419  (-0.58335)
     | > loss_dur: 0.15237  (0.11885)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.68513  (13.06310)
     | > current_lr: 0.00014 
     | > step_time: 0.73270  (0.65760)
     | > loader_time: 0.50450  (0.41538)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00701)
     | > avg_loss:[91m 0.38560 [0m(+0.00128)
     | > avg_log_mle:[92m -0.45906 [0m(-0.00721)
     | > avg_loss_dur:[91m 0.84466 [0m(+0.00850)


[4m[1m > EPOCH: 548/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:28:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 9875[0m
     | > loss: -0.38985  (-0.42589)
     | > log_mle: -0.54063  (-0.56548)
     | > loss_dur: 0.15078  (0.13959)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 26.41311  (13.39559)
     | > current_lr: 0.00014 
     | > step_time: 0.73870  (0.69682)
     | > loader_time: 0.48340  (0.45796)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00601)
     | > avg_loss:[91m 0.48797 [0m(+0.10236)
     | > avg_log_mle:[91m -0.44211 [0m(+0.01695)
     | > avg_loss_dur:[91m 0.93007 [0m(+0.08541)


[4m[1m > EPOCH: 549/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:29:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01001)
     | > avg_loss:[92m 0.42309 [0m(-0.06488)
     | > avg_log_mle:[92m -0.45168 [0m(-0.00957)
     | > avg_loss_dur:[92m 0.87477 [0m(-0.05531)


[4m[1m > EPOCH: 550/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:29:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 9900[0m
     | > loss: -0.49691  (-0.49691)
     | > log_mle: -0.59783  (-0.59783)
     | > loss_dur: 0.10092  (0.10092)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.66849  (21.66849)
     | > current_lr: 0.00014 
     | > step_time: 0.49950  (0.49945)
     | > loader_time: 0.27920  (0.27924)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.00200)
     | > avg_loss:[91m 0.43457 [0m(+0.01148)
     | > avg_log_mle:[92m -0.46491 [0m(-0.01323)
     | > avg_loss_dur:[91m 0.89948 [0m(+0.02471)


[4m[1m > EPOCH: 551/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:30:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 9925[0m
     | > loss: -0.39590  (-0.45897)
     | > log_mle: -0.55361  (-0.58266)
     | > loss_dur: 0.15771  (0.12369)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.84411  (15.30768)
     | > current_lr: 0.00014 
     | > step_time: 0.65360  (0.66732)
     | > loader_time: 0.41940  (0.41466)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00400)
     | > avg_loss:[92m 0.36324 [0m(-0.07133)
     | > avg_log_mle:[91m -0.44809 [0m(+0.01681)
     | > avg_loss_dur:[92m 0.81133 [0m(-0.08814)


[4m[1m > EPOCH: 552/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:30:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 9950[0m
     | > loss: -0.35421  (-0.41724)
     | > log_mle: -0.51595  (-0.55851)
     | > loss_dur: 0.16174  (0.14127)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.30693  (12.98222)
     | > current_lr: 0.00014 
     | > step_time: 1.02690  (0.74203)
     | > loader_time: 0.67160  (0.50281)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00100)
     | > avg_loss:[91m 0.37275 [0m(+0.00951)
     | > avg_log_mle:[92m -0.46367 [0m(-0.01557)
     | > avg_loss_dur:[91m 0.83641 [0m(+0.02508)


[4m[1m > EPOCH: 553/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:31:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.39456 [0m(+0.02181)
     | > avg_log_mle:[91m -0.44470 [0m(+0.01896)
     | > avg_loss_dur:[91m 0.83926 [0m(+0.00285)


[4m[1m > EPOCH: 554/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:31:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 9975[0m
     | > loss: -0.46328  (-0.49427)
     | > log_mle: -0.57953  (-0.59464)
     | > loss_dur: 0.11625  (0.10037)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.22422  (10.86056)
     | > current_lr: 0.00014 
     | > step_time: 0.68460  (0.63291)
     | > loader_time: 0.42840  (0.37034)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[91m 0.40768 [0m(+0.01312)
     | > avg_log_mle:[91m -0.44428 [0m(+0.00042)
     | > avg_loss_dur:[91m 0.85197 [0m(+0.01271)


[4m[1m > EPOCH: 555/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:32:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 10000[0m
     | > loss: -0.39031  (-0.43021)
     | > log_mle: -0.53156  (-0.56361)
     | > loss_dur: 0.14125  (0.13340)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.04455  (15.32948)
     | > current_lr: 0.00014 
     | > step_time: 0.69960  (0.69413)
     | > loader_time: 0.48540  (0.44390)


 > CHECKPOINT : ./output\run-September-15-2022_04+45AM-910d77a\checkpoint_10000.pth

[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00901)
     | > avg_loss:[92m 0.35983 [0m(-0.04786)
     | > avg_log_mle:[92m -0.46107 [0m(-0.01678)
     | > avg_loss_dur:[92m 0.82089 [0m(-0.03108)


[4m[1m > EPOCH: 556/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:32:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 10025[0m
     | > loss: -0.38411  (-0.41375)
     | > log_mle: -0.53284  (-0.55664)
     | > loss_dur: 0.14873  (0.14289)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.25480  (15.09970)
     | > current_lr: 0.00014 
     | > step_time: 0.85080  (0.77035)
     | > loader_time: 0.44540  (0.47708)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00100)
     | > avg_loss:[91m 0.38961 [0m(+0.02978)
     | > avg_log_mle:[91m -0.45272 [0m(+0.00835)
     | > avg_loss_dur:[91m 0.84232 [0m(+0.02143)


[4m[1m > EPOCH: 557/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:33:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01401)
     | > avg_loss:[92m 0.38021 [0m(-0.00940)
     | > avg_log_mle:[92m -0.46289 [0m(-0.01017)
     | > avg_loss_dur:[91m 0.84310 [0m(+0.00078)


[4m[1m > EPOCH: 558/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:33:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 10050[0m
     | > loss: -0.41538  (-0.47774)
     | > log_mle: -0.55499  (-0.59107)
     | > loss_dur: 0.13962  (0.11333)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.54182  (15.81021)
     | > current_lr: 0.00014 
     | > step_time: 0.63960  (0.67044)
     | > loader_time: 0.38130  (0.40186)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00601)
     | > avg_loss:[91m 0.38523 [0m(+0.00501)
     | > avg_log_mle:[91m -0.44672 [0m(+0.01617)
     | > avg_loss_dur:[92m 0.83195 [0m(-0.01116)


[4m[1m > EPOCH: 559/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:34:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 10075[0m
     | > loss: -0.32545  (-0.42669)
     | > log_mle: -0.51920  (-0.56669)
     | > loss_dur: 0.19374  (0.14001)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.25262  (17.79579)
     | > current_lr: 0.00014 
     | > step_time: 0.78570  (0.72178)
     | > loader_time: 0.48940  (0.45372)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[92m 0.36935 [0m(-0.01588)
     | > avg_log_mle:[92m -0.45772 [0m(-0.01100)
     | > avg_loss_dur:[92m 0.82706 [0m(-0.00488)


[4m[1m > EPOCH: 560/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:35:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00500)
     | > avg_loss:[91m 0.43139 [0m(+0.06204)
     | > avg_log_mle:[91m -0.43989 [0m(+0.01783)
     | > avg_loss_dur:[91m 0.87128 [0m(+0.04421)


[4m[1m > EPOCH: 561/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:35:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 10100[0m
     | > loss: -0.50925  (-0.51618)
     | > log_mle: -0.60376  (-0.60587)
     | > loss_dur: 0.09451  (0.08969)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.32275  (13.27240)
     | > current_lr: 0.00014 
     | > step_time: 0.55850  (0.60505)
     | > loader_time: 0.32530  (0.36083)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00400)
     | > avg_loss:[91m 0.43726 [0m(+0.00587)
     | > avg_log_mle:[92m -0.44961 [0m(-0.00972)
     | > avg_loss_dur:[91m 0.88687 [0m(+0.01559)


[4m[1m > EPOCH: 562/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:36:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 10125[0m
     | > loss: -0.43395  (-0.45495)
     | > log_mle: -0.57410  (-0.58077)
     | > loss_dur: 0.14015  (0.12581)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 15.50457  (18.23310)
     | > current_lr: 0.00014 
     | > step_time: 0.87380  (0.69029)
     | > loader_time: 0.60860  (0.42572)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[92m 0.36493 [0m(-0.07233)
     | > avg_log_mle:[92m -0.46390 [0m(-0.01429)
     | > avg_loss_dur:[92m 0.82883 [0m(-0.05803)


[4m[1m > EPOCH: 563/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:36:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 10150[0m
     | > loss: -0.37883  (-0.43003)
     | > log_mle: -0.52820  (-0.56622)
     | > loss_dur: 0.14937  (0.13619)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.12722  (11.70739)
     | > current_lr: 0.00014 
     | > step_time: 0.94890  (0.76245)
     | > loader_time: 0.62360  (0.49044)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00200)
     | > avg_loss:[91m 0.38617 [0m(+0.02124)
     | > avg_log_mle:[91m -0.45678 [0m(+0.00712)
     | > avg_loss_dur:[91m 0.84296 [0m(+0.01412)


[4m[1m > EPOCH: 564/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:37:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01001)
     | > avg_loss:[91m 0.39289 [0m(+0.00672)
     | > avg_log_mle:[92m -0.46068 [0m(-0.00390)
     | > avg_loss_dur:[91m 0.85358 [0m(+0.01062)


[4m[1m > EPOCH: 565/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:37:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 10175[0m
     | > loss: -0.43105  (-0.48779)
     | > log_mle: -0.57236  (-0.59777)
     | > loss_dur: 0.14131  (0.10998)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 20.51315  (12.46698)
     | > current_lr: 0.00014 
     | > step_time: 0.74170  (0.67481)
     | > loader_time: 0.47340  (0.42479)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00300)
     | > avg_loss:[92m 0.37813 [0m(-0.01476)
     | > avg_log_mle:[91m -0.45776 [0m(+0.00292)
     | > avg_loss_dur:[92m 0.83590 [0m(-0.01768)


[4m[1m > EPOCH: 566/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:38:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 10200[0m
     | > loss: -0.40154  (-0.44831)
     | > log_mle: -0.55051  (-0.57785)
     | > loss_dur: 0.14897  (0.12954)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.59382  (16.62741)
     | > current_lr: 0.00014 
     | > step_time: 0.91280  (0.71598)
     | > loader_time: 0.72070  (0.46267)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00100)
     | > avg_loss:[91m 0.41769 [0m(+0.03956)
     | > avg_log_mle:[92m -0.46346 [0m(-0.00569)
     | > avg_loss_dur:[91m 0.88115 [0m(+0.04525)


[4m[1m > EPOCH: 567/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:38:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00400)
     | > avg_loss:[92m 0.38906 [0m(-0.02863)
     | > avg_log_mle:[91m -0.45775 [0m(+0.00571)
     | > avg_loss_dur:[92m 0.84681 [0m(-0.03434)


[4m[1m > EPOCH: 568/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:39:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 10225[0m
     | > loss: -0.53651  (-0.53651)
     | > log_mle: -0.62630  (-0.62630)
     | > loss_dur: 0.08979  (0.08979)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.80322  (7.80322)
     | > current_lr: 0.00014 
     | > step_time: 0.65060  (0.65059)
     | > loader_time: 0.34730  (0.34732)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00300)
     | > avg_loss:[91m 0.40802 [0m(+0.01896)
     | > avg_log_mle:[92m -0.46138 [0m(-0.00363)
     | > avg_loss_dur:[91m 0.86939 [0m(+0.02258)


[4m[1m > EPOCH: 569/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:39:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 10250[0m
     | > loss: -0.40761  (-0.46425)
     | > log_mle: -0.57106  (-0.58922)
     | > loss_dur: 0.16344  (0.12497)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.80792  (11.28079)
     | > current_lr: 0.00014 
     | > step_time: 0.68060  (0.66898)
     | > loader_time: 0.45140  (0.41488)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00200)
     | > avg_loss:[91m 0.54678 [0m(+0.13877)
     | > avg_log_mle:[91m -0.45863 [0m(+0.00275)
     | > avg_loss_dur:[91m 1.00541 [0m(+0.13602)


[4m[1m > EPOCH: 570/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:40:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 10275[0m
     | > loss: -0.34646  (-0.42565)
     | > log_mle: -0.52487  (-0.56479)
     | > loss_dur: 0.17842  (0.13914)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.02202  (12.74519)
     | > current_lr: 0.00014 
     | > step_time: 0.87980  (0.75069)
     | > loader_time: 0.53750  (0.47363)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00801)
     | > avg_loss:[92m 0.41095 [0m(-0.13583)
     | > avg_log_mle:[91m -0.42883 [0m(+0.02980)
     | > avg_loss_dur:[92m 0.83979 [0m(-0.16563)


[4m[1m > EPOCH: 571/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:40:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01001)
     | > avg_loss:[91m 0.41622 [0m(+0.00527)
     | > avg_log_mle:[92m -0.45994 [0m(-0.03111)
     | > avg_loss_dur:[91m 0.87616 [0m(+0.03638)


[4m[1m > EPOCH: 572/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:41:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 10300[0m
     | > loss: -0.47258  (-0.50518)
     | > log_mle: -0.59426  (-0.60676)
     | > loss_dur: 0.12168  (0.10158)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 4.33073  (6.28549)
     | > current_lr: 0.00014 
     | > step_time: 0.72070  (0.65284)
     | > loader_time: 0.47640  (0.40212)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.01001)
     | > avg_loss:[91m 0.45611 [0m(+0.03989)
     | > avg_log_mle:[91m -0.40400 [0m(+0.05594)
     | > avg_loss_dur:[92m 0.86011 [0m(-0.01605)


[4m[1m > EPOCH: 573/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:41:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 10325[0m
     | > loss: -0.39976  (-0.41624)
     | > log_mle: -0.54527  (-0.55363)
     | > loss_dur: 0.14552  (0.13740)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.66128  (8.82717)
     | > current_lr: 0.00014 
     | > step_time: 0.73070  (0.69500)
     | > loader_time: 0.46340  (0.42830)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00901)
     | > avg_loss:[92m 0.41826 [0m(-0.03785)
     | > avg_log_mle:[92m -0.44700 [0m(-0.04300)
     | > avg_loss_dur:[91m 0.86526 [0m(+0.00516)


[4m[1m > EPOCH: 574/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:42:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.01001)
     | > avg_loss:[91m 0.43704 [0m(+0.01878)
     | > avg_log_mle:[91m -0.44671 [0m(+0.00030)
     | > avg_loss_dur:[91m 0.88375 [0m(+0.01849)


[4m[1m > EPOCH: 575/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:42:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 10350[0m
     | > loss: -0.50906  (-0.50906)
     | > log_mle: -0.61163  (-0.61163)
     | > loss_dur: 0.10257  (0.10257)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.25998  (11.25998)
     | > current_lr: 0.00014 
     | > step_time: 0.61760  (0.61756)
     | > loader_time: 0.26320  (0.26324)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00701)
     | > avg_loss:[92m 0.38715 [0m(-0.04989)
     | > avg_log_mle:[92m -0.45990 [0m(-0.01319)
     | > avg_loss_dur:[92m 0.84705 [0m(-0.03670)


[4m[1m > EPOCH: 576/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:43:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 10375[0m
     | > loss: -0.43998  (-0.47965)
     | > log_mle: -0.57690  (-0.59673)
     | > loss_dur: 0.13692  (0.11708)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 36.74333  (13.16480)
     | > current_lr: 0.00014 
     | > step_time: 0.64960  (0.66689)
     | > loader_time: 0.39940  (0.41323)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[91m 0.44560 [0m(+0.05845)
     | > avg_log_mle:[91m -0.42728 [0m(+0.03262)
     | > avg_loss_dur:[91m 0.87288 [0m(+0.02583)


[4m[1m > EPOCH: 577/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:43:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 10400[0m
     | > loss: -0.34830  (-0.42067)
     | > log_mle: -0.51894  (-0.55837)
     | > loss_dur: 0.17064  (0.13770)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.64013  (9.74381)
     | > current_lr: 0.00014 
     | > step_time: 1.02890  (0.74110)
     | > loader_time: 0.60050  (0.48208)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00000)
     | > avg_loss:[92m 0.38730 [0m(-0.05830)
     | > avg_log_mle:[92m -0.45667 [0m(-0.02940)
     | > avg_loss_dur:[92m 0.84397 [0m(-0.02890)


[4m[1m > EPOCH: 578/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:44:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00500)
     | > avg_loss:[91m 0.40769 [0m(+0.02039)
     | > avg_log_mle:[92m -0.45895 [0m(-0.00228)
     | > avg_loss_dur:[91m 0.86664 [0m(+0.02267)


[4m[1m > EPOCH: 579/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:45:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 10425[0m
     | > loss: -0.50756  (-0.51640)
     | > log_mle: -0.61689  (-0.61654)
     | > loss_dur: 0.10933  (0.10013)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 6.74451  (9.43985)
     | > current_lr: 0.00014 
     | > step_time: 0.69060  (0.63591)
     | > loader_time: 0.42240  (0.38301)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00701)
     | > avg_loss:[92m 0.39038 [0m(-0.01731)
     | > avg_log_mle:[92m -0.45978 [0m(-0.00083)
     | > avg_loss_dur:[92m 0.85016 [0m(-0.01648)


[4m[1m > EPOCH: 580/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:45:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 10450[0m
     | > loss: -0.42542  (-0.46517)
     | > log_mle: -0.55760  (-0.58758)
     | > loss_dur: 0.13219  (0.12241)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.23512  (11.81002)
     | > current_lr: 0.00015 
     | > step_time: 0.70060  (0.69224)
     | > loader_time: 0.43540  (0.43249)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06805 [0m(-0.00101)
     | > avg_loss:[91m 0.41245 [0m(+0.02207)
     | > avg_log_mle:[91m -0.45591 [0m(+0.00387)
     | > avg_loss_dur:[91m 0.86836 [0m(+0.01819)


[4m[1m > EPOCH: 581/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:46:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 10475[0m
     | > loss: -0.39143  (-0.43581)
     | > log_mle: -0.53275  (-0.56806)
     | > loss_dur: 0.14132  (0.13225)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 26.03977  (15.28391)
     | > current_lr: 0.00015 
     | > step_time: 0.85080  (0.76821)
     | > loader_time: 0.43440  (0.47513)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00101)
     | > avg_loss:[92m 0.39660 [0m(-0.01585)
     | > avg_log_mle:[91m -0.45500 [0m(+0.00091)
     | > avg_loss_dur:[92m 0.85160 [0m(-0.01676)


[4m[1m > EPOCH: 582/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:46:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[91m 0.41923 [0m(+0.02263)
     | > avg_log_mle:[91m -0.44880 [0m(+0.00620)
     | > avg_loss_dur:[91m 0.86802 [0m(+0.01643)


[4m[1m > EPOCH: 583/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:47:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 10500[0m
     | > loss: -0.39270  (-0.47504)
     | > log_mle: -0.54955  (-0.59122)
     | > loss_dur: 0.15685  (0.11618)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 15.40290  (16.24054)
     | > current_lr: 0.00015 
     | > step_time: 0.63660  (0.66661)
     | > loader_time: 0.38640  (0.40337)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00100)
     | > avg_loss:[91m 0.42423 [0m(+0.00500)
     | > avg_log_mle:[91m -0.44386 [0m(+0.00494)
     | > avg_loss_dur:[91m 0.86809 [0m(+0.00006)


[4m[1m > EPOCH: 584/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 09:47:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 10525[0m
     | > loss: -0.36909  (-0.43933)
     | > log_mle: -0.53059  (-0.57321)
     | > loss_dur: 0.16151  (0.13388)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.04310  (12.15664)
     | > current_lr: 0.00015 
     | > step_time: 6232.22960  (480.06811)
     | > loader_time: 0.55350  (0.46311)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.09609 [0m(+0.02803)
     | > avg_loss:[92m 0.37889 [0m(-0.04534)
     | > avg_log_mle:[92m -0.45564 [0m(-0.01178)
     | > avg_loss_dur:[92m 0.83453 [0m(-0.03356)


[4m[1m > EPOCH: 585/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:32:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.02903)
     | > avg_loss:[91m 0.40740 [0m(+0.02851)
     | > avg_log_mle:[92m -0.45618 [0m(-0.00054)
     | > avg_loss_dur:[91m 0.86358 [0m(+0.02905)


[4m[1m > EPOCH: 586/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:32:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 10550[0m
     | > loss: -0.53130  (-0.52891)
     | > log_mle: -0.62191  (-0.62111)
     | > loss_dur: 0.09061  (0.09220)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.29017  (11.10175)
     | > current_lr: 0.00015 
     | > step_time: 0.55650  (0.60055)
     | > loader_time: 0.33430  (0.34481)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00300)
     | > avg_loss:[92m 0.38233 [0m(-0.02507)
     | > avg_log_mle:[92m -0.45756 [0m(-0.00138)
     | > avg_loss_dur:[92m 0.83988 [0m(-0.02370)


[4m[1m > EPOCH: 587/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:33:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 10575[0m
     | > loss: -0.43256  (-0.47463)
     | > log_mle: -0.57637  (-0.59737)
     | > loss_dur: 0.14381  (0.12275)
     | > amp_scaler: 8192.00000  (15473.77778)
     | > grad_norm: 0.00000  (12.80151)
     | > current_lr: 0.00015 
     | > step_time: 0.81870  (0.68262)
     | > loader_time: 0.55150  (0.42183)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01201)
     | > avg_loss:[91m 0.41693 [0m(+0.03460)
     | > avg_log_mle:[91m -0.44979 [0m(+0.00777)
     | > avg_loss_dur:[91m 0.86672 [0m(+0.02683)


[4m[1m > EPOCH: 588/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:33:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 10600[0m
     | > loss: -0.37088  (-0.44444)
     | > log_mle: -0.52427  (-0.57520)
     | > loss_dur: 0.15339  (0.13076)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 34.24551  (16.35525)
     | > current_lr: 0.00015 
     | > step_time: 0.93690  (0.75581)
     | > loader_time: 0.55850  (0.50502)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00801)
     | > avg_loss:[92m 0.41681 [0m(-0.00012)
     | > avg_log_mle:[91m -0.44698 [0m(+0.00281)
     | > avg_loss_dur:[92m 0.86379 [0m(-0.00293)


[4m[1m > EPOCH: 589/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:34:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00600)
     | > avg_loss:[91m 0.41742 [0m(+0.00061)
     | > avg_log_mle:[92m -0.45319 [0m(-0.00621)
     | > avg_loss_dur:[91m 0.87060 [0m(+0.00682)


[4m[1m > EPOCH: 590/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:34:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 10625[0m
     | > loss: -0.45525  (-0.51812)
     | > log_mle: -0.58220  (-0.61729)
     | > loss_dur: 0.12695  (0.09918)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 32.84970  (14.07051)
     | > current_lr: 0.00015 
     | > step_time: 0.73570  (0.67121)
     | > loader_time: 0.44940  (0.42899)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.01401)
     | > avg_loss:[92m 0.36715 [0m(-0.05027)
     | > avg_log_mle:[92m -0.45449 [0m(-0.00131)
     | > avg_loss_dur:[92m 0.82165 [0m(-0.04896)


[4m[1m > EPOCH: 591/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:35:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 10650[0m
     | > loss: -0.40780  (-0.46386)
     | > log_mle: -0.55531  (-0.58509)
     | > loss_dur: 0.14751  (0.12123)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.90118  (16.42446)
     | > current_lr: 0.00015 
     | > step_time: 0.91080  (0.71081)
     | > loader_time: 0.61860  (0.45299)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00400)
     | > avg_loss:[91m 0.41857 [0m(+0.05142)
     | > avg_log_mle:[91m -0.45436 [0m(+0.00014)
     | > avg_loss_dur:[91m 0.87292 [0m(+0.05128)


[4m[1m > EPOCH: 592/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:35:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01001)
     | > avg_loss:[92m 0.40701 [0m(-0.01156)
     | > avg_log_mle:[91m -0.44261 [0m(+0.01175)
     | > avg_loss_dur:[92m 0.84962 [0m(-0.02331)


[4m[1m > EPOCH: 593/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:36:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 10675[0m
     | > loss: -0.52752  (-0.52752)
     | > log_mle: -0.61262  (-0.61262)
     | > loss_dur: 0.08511  (0.08511)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.00023  (18.00023)
     | > current_lr: 0.00015 
     | > step_time: 0.64960  (0.64959)
     | > loader_time: 0.35830  (0.35832)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07407 [0m(+0.00000)
     | > avg_loss:[91m 0.42668 [0m(+0.01967)
     | > avg_log_mle:[92m -0.45037 [0m(-0.00776)
     | > avg_loss_dur:[91m 0.87705 [0m(+0.02743)


[4m[1m > EPOCH: 594/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:36:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 10700[0m
     | > loss: -0.43854  (-0.48098)
     | > log_mle: -0.57946  (-0.59751)
     | > loss_dur: 0.14092  (0.11653)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.50370  (13.78403)
     | > current_lr: 0.00015 
     | > step_time: 0.67560  (0.66335)
     | > loader_time: 0.44740  (0.40750)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00901)
     | > avg_loss:[92m 0.37651 [0m(-0.05017)
     | > avg_log_mle:[91m -0.43445 [0m(+0.01592)
     | > avg_loss_dur:[92m 0.81096 [0m(-0.06609)


[4m[1m > EPOCH: 595/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:37:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 10725[0m
     | > loss: -0.35982  (-0.43770)
     | > log_mle: -0.51934  (-0.56858)
     | > loss_dur: 0.15952  (0.13088)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.05250  (23.36025)
     | > current_lr: 0.00015 
     | > step_time: 0.87380  (0.74968)
     | > loader_time: 0.54250  (0.47009)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01201)
     | > avg_loss:[91m 0.44473 [0m(+0.06823)
     | > avg_log_mle:[92m -0.43836 [0m(-0.00391)
     | > avg_loss_dur:[91m 0.88310 [0m(+0.07214)


[4m[1m > EPOCH: 596/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:37:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.01201)
     | > avg_loss:[92m 0.40131 [0m(-0.04342)
     | > avg_log_mle:[92m -0.45382 [0m(-0.01546)
     | > avg_loss_dur:[92m 0.85513 [0m(-0.02797)


[4m[1m > EPOCH: 597/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:38:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 10750[0m
     | > loss: -0.49606  (-0.50981)
     | > log_mle: -0.60479  (-0.61271)
     | > loss_dur: 0.10873  (0.10290)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.58232  (13.78563)
     | > current_lr: 0.00015 
     | > step_time: 0.72870  (0.65735)
     | > loader_time: 0.46440  (0.39611)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00601)
     | > avg_loss:[92m 0.34917 [0m(-0.05214)
     | > avg_log_mle:[91m -0.44950 [0m(+0.00432)
     | > avg_loss_dur:[92m 0.79867 [0m(-0.05646)


[4m[1m > EPOCH: 598/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:38:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 10775[0m
     | > loss: -0.43954  (-0.45626)
     | > log_mle: -0.56959  (-0.58296)
     | > loss_dur: 0.13004  (0.12670)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.09862  (14.97523)
     | > current_lr: 0.00015 
     | > step_time: 0.83480  (0.70328)
     | > loader_time: 0.55350  (0.44713)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00400)
     | > avg_loss:[91m 0.36688 [0m(+0.01771)
     | > avg_log_mle:[91m -0.44009 [0m(+0.00941)
     | > avg_loss_dur:[91m 0.80696 [0m(+0.00830)


[4m[1m > EPOCH: 599/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:39:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01401)
     | > avg_loss:[91m 0.38026 [0m(+0.01339)
     | > avg_log_mle:[92m -0.45163 [0m(-0.01154)
     | > avg_loss_dur:[91m 0.83189 [0m(+0.02493)


[4m[1m > EPOCH: 600/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:39:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 10800[0m
     | > loss: -0.54856  (-0.54856)
     | > log_mle: -0.63342  (-0.63342)
     | > loss_dur: 0.08486  (0.08486)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.31493  (20.31493)
     | > current_lr: 0.00015 
     | > step_time: 0.65160  (0.65159)
     | > loader_time: 0.25720  (0.25723)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06206 [0m(+0.00100)
     | > avg_loss:[91m 0.38546 [0m(+0.00520)
     | > avg_log_mle:[92m -0.45782 [0m(-0.00620)
     | > avg_loss_dur:[91m 0.84328 [0m(+0.01139)


[4m[1m > EPOCH: 601/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:40:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 10825[0m
     | > loss: -0.42222  (-0.47341)
     | > log_mle: -0.56342  (-0.59225)
     | > loss_dur: 0.14119  (0.11884)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.96037  (23.26882)
     | > current_lr: 0.00015 
     | > step_time: 0.65260  (0.66889)
     | > loader_time: 0.41840  (0.44984)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00500)
     | > avg_loss:[91m 0.43235 [0m(+0.04689)
     | > avg_log_mle:[91m -0.43873 [0m(+0.01909)
     | > avg_loss_dur:[91m 0.87108 [0m(+0.02780)


[4m[1m > EPOCH: 602/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:40:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 10850[0m
     | > loss: -0.39191  (-0.45683)
     | > log_mle: -0.53978  (-0.58403)
     | > loss_dur: 0.14786  (0.12720)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.01462  (14.63014)
     | > current_lr: 0.00015 
     | > step_time: 1.02190  (0.74582)
     | > loader_time: 0.61060  (0.46335)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00100)
     | > avg_loss:[92m 0.38498 [0m(-0.04738)
     | > avg_log_mle:[92m -0.45754 [0m(-0.01880)
     | > avg_loss_dur:[92m 0.84251 [0m(-0.02857)


[4m[1m > EPOCH: 603/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:41:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.38358 [0m(-0.00140)
     | > avg_log_mle:[91m -0.45040 [0m(+0.00714)
     | > avg_loss_dur:[92m 0.83397 [0m(-0.00854)


[4m[1m > EPOCH: 604/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:41:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 10875[0m
     | > loss: -0.50491  (-0.53037)
     | > log_mle: -0.61789  (-0.62678)
     | > loss_dur: 0.11298  (0.09641)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.02746  (9.12608)
     | > current_lr: 0.00015 
     | > step_time: 0.69060  (0.64192)
     | > loader_time: 0.40240  (0.38068)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00601)
     | > avg_loss:[92m 0.33456 [0m(-0.04902)
     | > avg_log_mle:[92m -0.45044 [0m(-0.00004)
     | > avg_loss_dur:[92m 0.78499 [0m(-0.04898)


[4m[1m > EPOCH: 605/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:42:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 10900[0m
     | > loss: -0.45378  (-0.48582)
     | > log_mle: -0.57053  (-0.60180)
     | > loss_dur: 0.11675  (0.11599)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.09651  (10.35075)
     | > current_lr: 0.00015 
     | > step_time: 0.70560  (0.69473)
     | > loader_time: 0.47340  (0.46602)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00400)
     | > avg_loss:[91m 0.39754 [0m(+0.06298)
     | > avg_log_mle:[92m -0.45281 [0m(-0.00238)
     | > avg_loss_dur:[91m 0.85035 [0m(+0.06536)


[4m[1m > EPOCH: 606/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:42:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 10925[0m
     | > loss: -0.40497  (-0.45756)
     | > log_mle: -0.54481  (-0.58255)
     | > loss_dur: 0.13984  (0.12499)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.42877  (19.35627)
     | > current_lr: 0.00015 
     | > step_time: 0.85380  (0.77559)
     | > loader_time: 0.44440  (0.48409)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00100)
     | > avg_loss:[91m 0.40191 [0m(+0.00437)
     | > avg_log_mle:[91m -0.45118 [0m(+0.00163)
     | > avg_loss_dur:[91m 0.85309 [0m(+0.00273)


[4m[1m > EPOCH: 607/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:43:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[91m 0.41023 [0m(+0.00832)
     | > avg_log_mle:[91m -0.43803 [0m(+0.01315)
     | > avg_loss_dur:[92m 0.84825 [0m(-0.00483)


[4m[1m > EPOCH: 608/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:44:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 10950[0m
     | > loss: -0.44820  (-0.50049)
     | > log_mle: -0.57306  (-0.60926)
     | > loss_dur: 0.12486  (0.10877)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.87867  (17.30431)
     | > current_lr: 0.00015 
     | > step_time: 0.64360  (0.67378)
     | > loader_time: 0.37830  (0.42072)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00100)
     | > avg_loss:[92m 0.39593 [0m(-0.01429)
     | > avg_log_mle:[92m -0.44876 [0m(-0.01074)
     | > avg_loss_dur:[92m 0.84470 [0m(-0.00356)


[4m[1m > EPOCH: 609/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:44:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 10975[0m
     | > loss: -0.40503  (-0.46839)
     | > log_mle: -0.55088  (-0.59002)
     | > loss_dur: 0.14585  (0.12164)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.31245  (17.48175)
     | > current_lr: 0.00015 
     | > step_time: 0.78670  (0.72404)
     | > loader_time: 0.51350  (0.50153)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00400)
     | > avg_loss:[92m 0.38842 [0m(-0.00751)
     | > avg_log_mle:[91m -0.44743 [0m(+0.00133)
     | > avg_loss_dur:[92m 0.83585 [0m(-0.00885)


[4m[1m > EPOCH: 610/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:45:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00601)
     | > avg_loss:[91m 0.41330 [0m(+0.02488)
     | > avg_log_mle:[92m -0.44899 [0m(-0.00156)
     | > avg_loss_dur:[91m 0.86229 [0m(+0.02644)


[4m[1m > EPOCH: 611/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:45:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 11000[0m
     | > loss: -0.55212  (-0.54719)
     | > log_mle: -0.64354  (-0.63874)
     | > loss_dur: 0.09141  (0.09156)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 24.68848  (18.61081)
     | > current_lr: 0.00015 
     | > step_time: 0.56650  (0.61056)
     | > loader_time: 0.35130  (0.35732)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.01001)
     | > avg_loss:[91m 0.43138 [0m(+0.01808)
     | > avg_log_mle:[92m -0.45188 [0m(-0.00289)
     | > avg_loss_dur:[91m 0.88326 [0m(+0.02097)


[4m[1m > EPOCH: 612/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:46:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 11025[0m
     | > loss: -0.46888  (-0.49680)
     | > log_mle: -0.59445  (-0.60758)
     | > loss_dur: 0.12557  (0.11078)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.37065  (14.59473)
     | > current_lr: 0.00015 
     | > step_time: 0.88180  (0.69552)
     | > loader_time: 0.58450  (0.42294)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00701)
     | > avg_loss:[92m 0.42368 [0m(-0.00770)
     | > avg_log_mle:[91m -0.43697 [0m(+0.01491)
     | > avg_loss_dur:[92m 0.86066 [0m(-0.02261)


[4m[1m > EPOCH: 613/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:46:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 11050[0m
     | > loss: -0.38807  (-0.46191)
     | > log_mle: -0.53768  (-0.58517)
     | > loss_dur: 0.14960  (0.12326)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.05717  (14.04192)
     | > current_lr: 0.00015 
     | > step_time: 0.95690  (0.77001)
     | > loader_time: 0.60450  (0.48738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00701)
     | > avg_loss:[92m 0.39679 [0m(-0.02690)
     | > avg_log_mle:[92m -0.45066 [0m(-0.01369)
     | > avg_loss_dur:[92m 0.84745 [0m(-0.01321)


[4m[1m > EPOCH: 614/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:47:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00701)
     | > avg_loss:[92m 0.35157 [0m(-0.04522)
     | > avg_log_mle:[91m -0.44504 [0m(+0.00563)
     | > avg_loss_dur:[92m 0.79661 [0m(-0.05084)


[4m[1m > EPOCH: 615/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:47:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 11075[0m
     | > loss: -0.48060  (-0.53218)
     | > log_mle: -0.59985  (-0.62997)
     | > loss_dur: 0.11925  (0.09779)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 24.24140  (15.05595)
     | > current_lr: 0.00015 
     | > step_time: 0.75070  (0.68202)
     | > loader_time: 0.47340  (0.43519)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00500)
     | > avg_loss:[91m 0.39500 [0m(+0.04342)
     | > avg_log_mle:[92m -0.45036 [0m(-0.00532)
     | > avg_loss_dur:[91m 0.84535 [0m(+0.04875)


[4m[1m > EPOCH: 616/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:48:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 11100[0m
     | > loss: -0.40873  (-0.48345)
     | > log_mle: -0.55993  (-0.60113)
     | > loss_dur: 0.15121  (0.11768)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.17139  (16.97648)
     | > current_lr: 0.00015 
     | > step_time: 0.92080  (0.71965)
     | > loader_time: 0.68560  (0.47185)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.01001)
     | > avg_loss:[92m 0.37238 [0m(-0.02261)
     | > avg_log_mle:[91m -0.43638 [0m(+0.01398)
     | > avg_loss_dur:[92m 0.80876 [0m(-0.03659)


[4m[1m > EPOCH: 617/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:48:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.01001)
     | > avg_loss:[91m 0.40501 [0m(+0.03262)
     | > avg_log_mle:[92m -0.43863 [0m(-0.00226)
     | > avg_loss_dur:[91m 0.84364 [0m(+0.03488)


[4m[1m > EPOCH: 618/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:49:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 11125[0m
     | > loss: -0.55314  (-0.55314)
     | > log_mle: -0.63808  (-0.63808)
     | > loss_dur: 0.08494  (0.08494)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.27678  (12.27678)
     | > current_lr: 0.00015 
     | > step_time: 0.65860  (0.65860)
     | > loader_time: 0.37630  (0.37634)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.00901)
     | > avg_loss:[91m 0.40555 [0m(+0.00054)
     | > avg_log_mle:[92m -0.43994 [0m(-0.00130)
     | > avg_loss_dur:[91m 0.84549 [0m(+0.00184)


[4m[1m > EPOCH: 619/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:49:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 11150[0m
     | > loss: -0.44242  (-0.48058)
     | > log_mle: -0.57804  (-0.59658)
     | > loss_dur: 0.13562  (0.11600)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.47913  (13.05137)
     | > current_lr: 0.00015 
     | > step_time: 0.67860  (0.67074)
     | > loader_time: 0.39440  (0.41112)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00601)
     | > avg_loss:[92m 0.38177 [0m(-0.02379)
     | > avg_log_mle:[92m -0.44523 [0m(-0.00529)
     | > avg_loss_dur:[92m 0.82699 [0m(-0.01849)


[4m[1m > EPOCH: 620/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:50:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 11175[0m
     | > loss: -0.38537  (-0.46009)
     | > log_mle: -0.53682  (-0.58520)
     | > loss_dur: 0.15144  (0.12511)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.98716  (13.25891)
     | > current_lr: 0.00015 
     | > step_time: 0.88480  (0.75622)
     | > loader_time: 0.53050  (0.47623)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00501)
     | > avg_loss:[91m 0.38979 [0m(+0.00802)
     | > avg_log_mle:[92m -0.44982 [0m(-0.00459)
     | > avg_loss_dur:[91m 0.83961 [0m(+0.01262)


[4m[1m > EPOCH: 621/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:50:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[91m 0.40322 [0m(+0.01343)
     | > avg_log_mle:[91m -0.44651 [0m(+0.00331)
     | > avg_loss_dur:[91m 0.84973 [0m(+0.01012)


[4m[1m > EPOCH: 622/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:51:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 11200[0m
     | > loss: -0.51439  (-0.53886)
     | > log_mle: -0.61809  (-0.63610)
     | > loss_dur: 0.10370  (0.09724)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.62269  (12.97338)
     | > current_lr: 0.00016 
     | > step_time: 0.73570  (0.66260)
     | > loader_time: 0.50650  (0.40737)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01201)
     | > avg_loss:[92m 0.34107 [0m(-0.06215)
     | > avg_log_mle:[92m -0.45281 [0m(-0.00630)
     | > avg_loss_dur:[92m 0.79388 [0m(-0.05585)


[4m[1m > EPOCH: 623/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:51:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 11225[0m
     | > loss: -0.44391  (-0.49929)
     | > log_mle: -0.56611  (-0.61014)
     | > loss_dur: 0.12221  (0.11085)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 33.91013  (17.34414)
     | > current_lr: 0.00016 
     | > step_time: 0.74370  (0.70146)
     | > loader_time: 0.46240  (0.45368)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00901)
     | > avg_loss:[91m 0.43769 [0m(+0.09662)
     | > avg_log_mle:[91m -0.44728 [0m(+0.00553)
     | > avg_loss_dur:[91m 0.88497 [0m(+0.09109)


[4m[1m > EPOCH: 624/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:52:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.00801)
     | > avg_loss:[92m 0.37844 [0m(-0.05925)
     | > avg_log_mle:[91m -0.43242 [0m(+0.01486)
     | > avg_loss_dur:[92m 0.81086 [0m(-0.07411)


[4m[1m > EPOCH: 625/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:52:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 11250[0m
     | > loss: -0.54635  (-0.54635)
     | > log_mle: -0.63792  (-0.63792)
     | > loss_dur: 0.09157  (0.09157)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.91642  (22.91642)
     | > current_lr: 0.00016 
     | > step_time: 0.50350  (0.50346)
     | > loader_time: 0.28730  (0.28726)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01301)
     | > avg_loss:[91m 0.46449 [0m(+0.08604)
     | > avg_log_mle:[92m -0.43736 [0m(-0.00494)
     | > avg_loss_dur:[91m 0.90185 [0m(+0.09099)


[4m[1m > EPOCH: 626/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:53:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 11275[0m
     | > loss: -0.46417  (-0.48987)
     | > log_mle: -0.59233  (-0.60269)
     | > loss_dur: 0.12816  (0.11281)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.16952  (16.92862)
     | > current_lr: 0.00016 
     | > step_time: 0.71160  (0.71579)
     | > loader_time: 0.48640  (0.45584)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00400)
     | > avg_loss:[92m 0.39821 [0m(-0.06628)
     | > avg_log_mle:[92m -0.44888 [0m(-0.01152)
     | > avg_loss_dur:[92m 0.84709 [0m(-0.05476)


[4m[1m > EPOCH: 627/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:54:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 11300[0m
     | > loss: -0.41320  (-0.47751)
     | > log_mle: -0.55506  (-0.59891)
     | > loss_dur: 0.14186  (0.12140)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 23.99052  (15.93061)
     | > current_lr: 0.00016 
     | > step_time: 1.01890  (0.75133)
     | > loader_time: 0.64860  (0.50181)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00701)
     | > avg_loss:[92m 0.35394 [0m(-0.04427)
     | > avg_log_mle:[91m -0.44385 [0m(+0.00503)
     | > avg_loss_dur:[92m 0.79779 [0m(-0.04930)


[4m[1m > EPOCH: 628/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:54:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00300)
     | > avg_loss:[91m 0.38196 [0m(+0.02802)
     | > avg_log_mle:[91m -0.41944 [0m(+0.02441)
     | > avg_loss_dur:[91m 0.80141 [0m(+0.00362)


[4m[1m > EPOCH: 629/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:55:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 11325[0m
     | > loss: -0.52645  (-0.52968)
     | > log_mle: -0.62881  (-0.62582)
     | > loss_dur: 0.10236  (0.09614)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.13521  (14.18551)
     | > current_lr: 0.00016 
     | > step_time: 0.69060  (0.63791)
     | > loader_time: 0.42040  (0.37801)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.01001)
     | > avg_loss:[92m 0.37571 [0m(-0.00625)
     | > avg_log_mle:[92m -0.44028 [0m(-0.02083)
     | > avg_loss_dur:[91m 0.81599 [0m(+0.01458)


[4m[1m > EPOCH: 630/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:55:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 11350[0m
     | > loss: -0.43318  (-0.49515)
     | > log_mle: -0.56410  (-0.61111)
     | > loss_dur: 0.13092  (0.11596)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.60354  (12.17604)
     | > current_lr: 0.00016 
     | > step_time: 0.87680  (0.76299)
     | > loader_time: 0.53050  (0.48204)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00300)
     | > avg_loss:[92m 0.35116 [0m(-0.02455)
     | > avg_log_mle:[91m -0.43703 [0m(+0.00325)
     | > avg_loss_dur:[92m 0.78819 [0m(-0.02780)


[4m[1m > EPOCH: 631/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:56:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 11375[0m
     | > loss: -0.40358  (-0.45907)
     | > log_mle: -0.54462  (-0.58495)
     | > loss_dur: 0.14104  (0.12587)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.63085  (15.39597)
     | > current_lr: 0.00016 
     | > step_time: 0.91880  (0.85784)
     | > loader_time: 0.57250  (0.54391)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08307 [0m(+0.01601)
     | > avg_loss:[91m 0.48468 [0m(+0.13352)
     | > avg_log_mle:[91m -0.42870 [0m(+0.00832)
     | > avg_loss_dur:[91m 0.91338 [0m(+0.12520)


[4m[1m > EPOCH: 632/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:56:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08508 [0m(+0.00200)
     | > avg_loss:[92m 0.41800 [0m(-0.06668)
     | > avg_log_mle:[92m -0.44490 [0m(-0.01620)
     | > avg_loss_dur:[92m 0.86290 [0m(-0.05048)


[4m[1m > EPOCH: 633/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:57:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 11400[0m
     | > loss: -0.45614  (-0.52325)
     | > log_mle: -0.58246  (-0.62593)
     | > loss_dur: 0.12632  (0.10268)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.35655  (11.95960)
     | > current_lr: 0.00016 
     | > step_time: 0.68560  (0.71749)
     | > loader_time: 0.45240  (0.45792)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.01001)
     | > avg_loss:[92m 0.40243 [0m(-0.01557)
     | > avg_log_mle:[91m -0.40853 [0m(+0.03637)
     | > avg_loss_dur:[92m 0.81096 [0m(-0.05194)


[4m[1m > EPOCH: 634/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:57:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 11425[0m
     | > loss: -0.39341  (-0.46972)
     | > log_mle: -0.55175  (-0.59355)
     | > loss_dur: 0.15834  (0.12383)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.53487  (11.71819)
     | > current_lr: 0.00016 
     | > step_time: 0.79470  (0.72712)
     | > loader_time: 0.48440  (0.48513)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00801)
     | > avg_loss:[91m 0.43002 [0m(+0.02759)
     | > avg_log_mle:[92m -0.44081 [0m(-0.03228)
     | > avg_loss_dur:[91m 0.87083 [0m(+0.05987)


[4m[1m > EPOCH: 635/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:58:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01001)
     | > avg_loss:[92m 0.32641 [0m(-0.10361)
     | > avg_log_mle:[92m -0.44301 [0m(-0.00220)
     | > avg_loss_dur:[92m 0.76942 [0m(-0.10141)


[4m[1m > EPOCH: 636/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:59:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 11450[0m
     | > loss: -0.55400  (-0.56117)
     | > log_mle: -0.64192  (-0.64823)
     | > loss_dur: 0.08792  (0.08706)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.21153  (14.56528)
     | > current_lr: 0.00016 
     | > step_time: 0.58050  (0.61756)
     | > loader_time: 0.35330  (0.37884)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07707 [0m(+0.00000)
     | > avg_loss:[91m 0.36911 [0m(+0.04270)
     | > avg_log_mle:[91m -0.43408 [0m(+0.00892)
     | > avg_loss_dur:[91m 0.80319 [0m(+0.03377)


[4m[1m > EPOCH: 637/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 11:59:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 11475[0m
     | > loss: -0.46771  (-0.50942)
     | > log_mle: -0.59676  (-0.62014)
     | > loss_dur: 0.12905  (0.11073)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.86497  (11.39516)
     | > current_lr: 0.00016 
     | > step_time: 0.89280  (0.70753)
     | > loader_time: 0.59450  (0.46264)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08107 [0m(+0.00400)
     | > avg_loss:[91m 0.37461 [0m(+0.00550)
     | > avg_log_mle:[92m -0.43453 [0m(-0.00045)
     | > avg_loss_dur:[91m 0.80915 [0m(+0.00595)


[4m[1m > EPOCH: 638/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:00:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 11500[0m
     | > loss: -0.41785  (-0.47338)
     | > log_mle: -0.55125  (-0.59419)
     | > loss_dur: 0.13340  (0.12080)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.19996  (16.12086)
     | > current_lr: 0.00016 
     | > step_time: 0.96590  (0.82231)
     | > loader_time: 0.67060  (0.54750)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.01301)
     | > avg_loss:[92m 0.36614 [0m(-0.00848)
     | > avg_log_mle:[92m -0.44151 [0m(-0.00697)
     | > avg_loss_dur:[92m 0.80765 [0m(-0.00150)


[4m[1m > EPOCH: 639/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:00:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08408 [0m(+0.01602)
     | > avg_loss:[92m 0.34498 [0m(-0.02115)
     | > avg_log_mle:[91m -0.43506 [0m(+0.00645)
     | > avg_loss_dur:[92m 0.78004 [0m(-0.02761)


[4m[1m > EPOCH: 640/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:01:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 11525[0m
     | > loss: -0.49857  (-0.53196)
     | > log_mle: -0.60770  (-0.63067)
     | > loss_dur: 0.10913  (0.09871)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.78382  (8.95948)
     | > current_lr: 0.00016 
     | > step_time: 0.74670  (0.75480)
     | > loader_time: 0.42840  (0.47443)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07607 [0m(-0.00801)
     | > avg_loss:[91m 0.39286 [0m(+0.04787)
     | > avg_log_mle:[92m -0.43877 [0m(-0.00371)
     | > avg_loss_dur:[91m 0.83162 [0m(+0.05158)


[4m[1m > EPOCH: 641/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:01:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 11550[0m
     | > loss: -0.43428  (-0.48997)
     | > log_mle: -0.56184  (-0.60449)
     | > loss_dur: 0.12756  (0.11452)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.85310  (13.58522)
     | > current_lr: 0.00016 
     | > step_time: 0.92080  (0.76528)
     | > loader_time: 0.66360  (0.48152)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.09008 [0m(+0.01401)
     | > avg_loss:[92m 0.36940 [0m(-0.02345)
     | > avg_log_mle:[92m -0.44245 [0m(-0.00368)
     | > avg_loss_dur:[92m 0.81185 [0m(-0.01977)


[4m[1m > EPOCH: 642/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:02:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.01802)
     | > avg_loss:[91m 0.41797 [0m(+0.04857)
     | > avg_log_mle:[91m -0.42742 [0m(+0.01503)
     | > avg_loss_dur:[91m 0.84539 [0m(+0.03354)


[4m[1m > EPOCH: 643/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:02:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 11575[0m
     | > loss: -0.55081  (-0.55081)
     | > log_mle: -0.64008  (-0.64008)
     | > loss_dur: 0.08927  (0.08927)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.60022  (7.60022)
     | > current_lr: 0.00016 
     | > step_time: 0.65560  (0.65560)
     | > loader_time: 0.40340  (0.40337)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00200)
     | > avg_loss:[92m 0.36552 [0m(-0.05245)
     | > avg_log_mle:[92m -0.43729 [0m(-0.00988)
     | > avg_loss_dur:[92m 0.80281 [0m(-0.04257)


[4m[1m > EPOCH: 644/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:03:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 11600[0m
     | > loss: -0.48348  (-0.51696)
     | > log_mle: -0.61092  (-0.62559)
     | > loss_dur: 0.12744  (0.10863)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.57497  (11.90324)
     | > current_lr: 0.00016 
     | > step_time: 0.78170  (0.70689)
     | > loader_time: 0.55250  (0.46092)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01301)
     | > avg_loss:[91m 0.36694 [0m(+0.00142)
     | > avg_log_mle:[92m -0.43779 [0m(-0.00050)
     | > avg_loss_dur:[91m 0.80473 [0m(+0.00192)


[4m[1m > EPOCH: 645/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:04:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 11625[0m
     | > loss: -0.41081  (-0.47865)
     | > log_mle: -0.55164  (-0.59755)
     | > loss_dur: 0.14083  (0.11889)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.56827  (13.24829)
     | > current_lr: 0.00016 
     | > step_time: 1.24610  (0.82895)
     | > loader_time: 0.55550  (0.51093)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00300)
     | > avg_loss:[91m 0.39155 [0m(+0.02461)
     | > avg_log_mle:[91m -0.43583 [0m(+0.00197)
     | > avg_loss_dur:[91m 0.82738 [0m(+0.02265)


[4m[1m > EPOCH: 646/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:04:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00901)
     | > avg_loss:[92m 0.32922 [0m(-0.06233)
     | > avg_log_mle:[92m -0.44452 [0m(-0.00869)
     | > avg_loss_dur:[92m 0.77374 [0m(-0.05364)


[4m[1m > EPOCH: 647/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:05:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 11650[0m
     | > loss: -0.54507  (-0.55428)
     | > log_mle: -0.63966  (-0.64668)
     | > loss_dur: 0.09459  (0.09240)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.77073  (20.83786)
     | > current_lr: 0.00016 
     | > step_time: 0.73570  (0.66260)
     | > loader_time: 0.51450  (0.43965)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00701)
     | > avg_loss:[91m 0.39336 [0m(+0.06414)
     | > avg_log_mle:[91m -0.43568 [0m(+0.00883)
     | > avg_loss_dur:[91m 0.82905 [0m(+0.05531)


[4m[1m > EPOCH: 648/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:05:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 11675[0m
     | > loss: -0.42879  (-0.49682)
     | > log_mle: -0.57092  (-0.61008)
     | > loss_dur: 0.14213  (0.11325)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.61425  (20.80324)
     | > current_lr: 0.00016 
     | > step_time: 0.74270  (0.70264)
     | > loader_time: 0.48540  (0.45978)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01201)
     | > avg_loss:[92m 0.31169 [0m(-0.08168)
     | > avg_log_mle:[92m -0.44358 [0m(-0.00790)
     | > avg_loss_dur:[92m 0.75527 [0m(-0.07378)


[4m[1m > EPOCH: 649/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:06:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00600)
     | > avg_loss:[91m 0.38820 [0m(+0.07651)
     | > avg_log_mle:[91m -0.43615 [0m(+0.00743)
     | > avg_loss_dur:[91m 0.82435 [0m(+0.06908)


[4m[1m > EPOCH: 650/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:06:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 11700[0m
     | > loss: -0.57241  (-0.57241)
     | > log_mle: -0.66549  (-0.66549)
     | > loss_dur: 0.09309  (0.09309)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.29262  (12.29262)
     | > current_lr: 0.00016 
     | > step_time: 0.77310  (0.77307)
     | > loader_time: 0.31330  (0.31328)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07306 [0m(+0.00100)
     | > avg_loss:[91m 0.40590 [0m(+0.01770)
     | > avg_log_mle:[92m -0.43931 [0m(-0.00315)
     | > avg_loss_dur:[91m 0.84521 [0m(+0.02086)


[4m[1m > EPOCH: 651/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:07:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 11725[0m
     | > loss: -0.48635  (-0.53425)
     | > log_mle: -0.61325  (-0.63741)
     | > loss_dur: 0.12690  (0.10316)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.30727  (14.35398)
     | > current_lr: 0.00016 
     | > step_time: 0.65060  (0.70350)
     | > loader_time: 0.44040  (0.45470)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00100)
     | > avg_loss:[92m 0.38287 [0m(-0.02304)
     | > avg_log_mle:[92m -0.44262 [0m(-0.00331)
     | > avg_loss_dur:[92m 0.82549 [0m(-0.01972)


[4m[1m > EPOCH: 652/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:07:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 11750[0m
     | > loss: -0.42692  (-0.50773)
     | > log_mle: -0.56307  (-0.61649)
     | > loss_dur: 0.13615  (0.10876)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.58381  (15.67786)
     | > current_lr: 0.00016 
     | > step_time: 1.08100  (0.80287)
     | > loader_time: 0.67160  (0.51232)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.39713 [0m(+0.01426)
     | > avg_log_mle:[91m -0.42877 [0m(+0.01384)
     | > avg_loss_dur:[91m 0.82591 [0m(+0.00042)


[4m[1m > EPOCH: 653/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:08:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[91m 0.43723 [0m(+0.04010)
     | > avg_log_mle:[92m -0.44192 [0m(-0.01315)
     | > avg_loss_dur:[91m 0.87915 [0m(+0.05325)


[4m[1m > EPOCH: 654/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:08:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 11775[0m
     | > loss: -0.56366  (-0.56958)
     | > log_mle: -0.65889  (-0.65814)
     | > loss_dur: 0.09523  (0.08856)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.79879  (6.70482)
     | > current_lr: 0.00016 
     | > step_time: 0.70060  (0.68162)
     | > loader_time: 0.43740  (0.40370)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[92m 0.40458 [0m(-0.03265)
     | > avg_log_mle:[91m -0.43326 [0m(+0.00866)
     | > avg_loss_dur:[92m 0.83783 [0m(-0.04132)


[4m[1m > EPOCH: 655/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:09:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 11800[0m
     | > loss: -0.48257  (-0.51334)
     | > log_mle: -0.59308  (-0.62320)
     | > loss_dur: 0.11050  (0.10987)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.00642  (13.55887)
     | > current_lr: 0.00016 
     | > step_time: 0.79770  (0.74308)
     | > loader_time: 0.61860  (0.48904)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00100)
     | > avg_loss:[92m 0.35044 [0m(-0.05414)
     | > avg_log_mle:[92m -0.44643 [0m(-0.01318)
     | > avg_loss_dur:[92m 0.79687 [0m(-0.04096)


[4m[1m > EPOCH: 656/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:10:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 11825[0m
     | > loss: -0.43466  (-0.46777)
     | > log_mle: -0.56022  (-0.59213)
     | > loss_dur: 0.12556  (0.12436)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.59078  (17.79817)
     | > current_lr: 0.00016 
     | > step_time: 0.91380  (0.82016)
     | > loader_time: 0.50450  (0.54850)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08007 [0m(+0.00300)
     | > avg_loss:[91m 0.44633 [0m(+0.09590)
     | > avg_log_mle:[91m -0.43369 [0m(+0.01275)
     | > avg_loss_dur:[91m 0.88002 [0m(+0.08315)


[4m[1m > EPOCH: 657/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:10:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.01702)
     | > avg_loss:[91m 0.45458 [0m(+0.00824)
     | > avg_log_mle:[92m -0.44289 [0m(-0.00920)
     | > avg_loss_dur:[91m 0.89746 [0m(+0.01744)


[4m[1m > EPOCH: 658/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:11:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 11850[0m
     | > loss: -0.46294  (-0.54268)
     | > log_mle: -0.58773  (-0.63952)
     | > loss_dur: 0.12479  (0.09684)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 26.27403  (20.16907)
     | > current_lr: 0.00016 
     | > step_time: 0.64260  (0.67361)
     | > loader_time: 0.44440  (0.42822)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.01001)
     | > avg_loss:[92m 0.39490 [0m(-0.05968)
     | > avg_log_mle:[91m -0.42803 [0m(+0.01485)
     | > avg_loss_dur:[92m 0.82294 [0m(-0.07453)


[4m[1m > EPOCH: 659/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:11:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 11875[0m
     | > loss: -0.44243  (-0.51263)
     | > log_mle: -0.56823  (-0.62009)
     | > loss_dur: 0.12580  (0.10746)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.43179  (13.97226)
     | > current_lr: 0.00016 
     | > step_time: 0.78970  (0.72697)
     | > loader_time: 0.49640  (0.46596)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00000)
     | > avg_loss:[92m 0.37669 [0m(-0.01821)
     | > avg_log_mle:[92m -0.43534 [0m(-0.00731)
     | > avg_loss_dur:[92m 0.81203 [0m(-0.01090)


[4m[1m > EPOCH: 660/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:12:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08208 [0m(+0.00901)
     | > avg_loss:[92m 0.36617 [0m(-0.01053)
     | > avg_log_mle:[92m -0.43665 [0m(-0.00131)
     | > avg_loss_dur:[92m 0.80282 [0m(-0.00922)


[4m[1m > EPOCH: 661/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:12:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 11900[0m
     | > loss: -0.57954  (-0.59282)
     | > log_mle: -0.66472  (-0.67298)
     | > loss_dur: 0.08518  (0.08016)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.74341  (9.66646)
     | > current_lr: 0.00017 
     | > step_time: 0.56550  (0.61606)
     | > loader_time: 0.38430  (0.40036)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07607 [0m(-0.00601)
     | > avg_loss:[91m 0.43596 [0m(+0.06979)
     | > avg_log_mle:[91m -0.43634 [0m(+0.00031)
     | > avg_loss_dur:[91m 0.87230 [0m(+0.06948)


[4m[1m > EPOCH: 662/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:13:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 11925[0m
     | > loss: -0.52996  (-0.53624)
     | > log_mle: -0.63542  (-0.63798)
     | > loss_dur: 0.10546  (0.10174)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.92884  (17.43414)
     | > current_lr: 0.00017 
     | > step_time: 0.87780  (0.69663)
     | > loader_time: 0.56850  (0.43818)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00701)
     | > avg_loss:[92m 0.35709 [0m(-0.07887)
     | > avg_log_mle:[91m -0.43285 [0m(+0.00349)
     | > avg_loss_dur:[92m 0.78994 [0m(-0.08236)


[4m[1m > EPOCH: 663/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:13:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 11950[0m
     | > loss: -0.41417  (-0.49418)
     | > log_mle: -0.54092  (-0.60792)
     | > loss_dur: 0.12675  (0.11374)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 54.42512  (16.88486)
     | > current_lr: 0.00017 
     | > step_time: 0.95790  (0.77414)
     | > loader_time: 0.58150  (0.49076)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00400)
     | > avg_loss:[91m 0.40994 [0m(+0.05286)
     | > avg_log_mle:[91m -0.42090 [0m(+0.01195)
     | > avg_loss_dur:[91m 0.83084 [0m(+0.04091)


[4m[1m > EPOCH: 664/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:14:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00501)
     | > avg_loss:[91m 0.46557 [0m(+0.05563)
     | > avg_log_mle:[91m -0.41045 [0m(+0.01045)
     | > avg_loss_dur:[91m 0.87602 [0m(+0.04518)


[4m[1m > EPOCH: 665/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:14:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 11975[0m
     | > loss: -0.48092  (-0.54088)
     | > log_mle: -0.60316  (-0.63794)
     | > loss_dur: 0.12224  (0.09706)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.27834  (13.75676)
     | > current_lr: 0.00017 
     | > step_time: 0.74870  (0.68122)
     | > loader_time: 0.44040  (0.41057)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00000)
     | > avg_loss:[92m 0.41045 [0m(-0.05512)
     | > avg_log_mle:[92m -0.42207 [0m(-0.01162)
     | > avg_loss_dur:[92m 0.83251 [0m(-0.04351)


[4m[1m > EPOCH: 666/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:15:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 12000[0m
     | > loss: -0.47687  (-0.51265)
     | > log_mle: -0.60087  (-0.62383)
     | > loss_dur: 0.12399  (0.11118)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.67801  (12.50547)
     | > current_lr: 0.00017 
     | > step_time: 0.92180  (0.72074)
     | > loader_time: 0.66360  (0.45900)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[92m 0.33878 [0m(-0.07167)
     | > avg_log_mle:[92m -0.43035 [0m(-0.00828)
     | > avg_loss_dur:[92m 0.76912 [0m(-0.06339)


[4m[1m > EPOCH: 667/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:16:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[91m 0.36928 [0m(+0.03050)
     | > avg_log_mle:[92m -0.43643 [0m(-0.00608)
     | > avg_loss_dur:[91m 0.80571 [0m(+0.03659)


[4m[1m > EPOCH: 668/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:16:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 12025[0m
     | > loss: -0.59627  (-0.59627)
     | > log_mle: -0.67381  (-0.67381)
     | > loss_dur: 0.07754  (0.07754)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.79122  (12.79122)
     | > current_lr: 0.00017 
     | > step_time: 0.66060  (0.66060)
     | > loader_time: 0.36330  (0.36333)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00701)
     | > avg_loss:[91m 0.38256 [0m(+0.01328)
     | > avg_log_mle:[92m -0.43756 [0m(-0.00113)
     | > avg_loss_dur:[91m 0.82012 [0m(+0.01441)


[4m[1m > EPOCH: 669/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:17:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 12050[0m
     | > loss: -0.51530  (-0.54891)
     | > log_mle: -0.62742  (-0.64606)
     | > loss_dur: 0.11212  (0.09715)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.12720  (12.66370)
     | > current_lr: 0.00017 
     | > step_time: 0.68260  (0.67261)
     | > loader_time: 0.44440  (0.43114)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00901)
     | > avg_loss:[91m 0.38622 [0m(+0.00366)
     | > avg_log_mle:[91m -0.42362 [0m(+0.01394)
     | > avg_loss_dur:[92m 0.80984 [0m(-0.01028)


[4m[1m > EPOCH: 670/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:17:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 12075[0m
     | > loss: -0.42770  (-0.50178)
     | > log_mle: -0.55575  (-0.61307)
     | > loss_dur: 0.12804  (0.11129)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.53602  (12.68541)
     | > current_lr: 0.00017 
     | > step_time: 0.88180  (0.75776)
     | > loader_time: 0.55350  (0.48544)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[92m 0.34193 [0m(-0.04429)
     | > avg_log_mle:[92m -0.43356 [0m(-0.00994)
     | > avg_loss_dur:[92m 0.77549 [0m(-0.03435)


[4m[1m > EPOCH: 671/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:18:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[91m 0.40872 [0m(+0.06679)
     | > avg_log_mle:[91m -0.41911 [0m(+0.01445)
     | > avg_loss_dur:[91m 0.82783 [0m(+0.05234)


[4m[1m > EPOCH: 672/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:18:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 12100[0m
     | > loss: -0.54608  (-0.57024)
     | > log_mle: -0.64755  (-0.65981)
     | > loss_dur: 0.10147  (0.08957)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.54318  (7.98762)
     | > current_lr: 0.00017 
     | > step_time: 0.73770  (0.66260)
     | > loader_time: 0.50650  (0.40812)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[92m 0.39317 [0m(-0.01555)
     | > avg_log_mle:[92m -0.43457 [0m(-0.01546)
     | > avg_loss_dur:[92m 0.82774 [0m(-0.00009)


[4m[1m > EPOCH: 673/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:19:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 12125[0m
     | > loss: -0.47002  (-0.52934)
     | > log_mle: -0.59238  (-0.63474)
     | > loss_dur: 0.12236  (0.10541)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.88937  (9.51855)
     | > current_lr: 0.00017 
     | > step_time: 0.74570  (0.70127)
     | > loader_time: 0.50050  (0.44231)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00300)
     | > avg_loss:[92m 0.38851 [0m(-0.00466)
     | > avg_log_mle:[91m -0.41660 [0m(+0.01797)
     | > avg_loss_dur:[92m 0.80511 [0m(-0.02263)


[4m[1m > EPOCH: 674/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:19:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00400)
     | > avg_loss:[91m 0.44019 [0m(+0.05168)
     | > avg_log_mle:[92m -0.43147 [0m(-0.01487)
     | > avg_loss_dur:[91m 0.87166 [0m(+0.06656)


[4m[1m > EPOCH: 675/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:20:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 12150[0m
     | > loss: -0.60147  (-0.60147)
     | > log_mle: -0.67796  (-0.67796)
     | > loss_dur: 0.07649  (0.07649)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.20551  (21.20551)
     | > current_lr: 0.00017 
     | > step_time: 0.50550  (0.50546)
     | > loader_time: 0.27220  (0.27225)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00801)
     | > avg_loss:[92m 0.42533 [0m(-0.01487)
     | > avg_log_mle:[92m -0.43489 [0m(-0.00342)
     | > avg_loss_dur:[92m 0.86022 [0m(-0.01144)


[4m[1m > EPOCH: 676/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:20:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 12175[0m
     | > loss: -0.49087  (-0.54612)
     | > log_mle: -0.61186  (-0.64514)
     | > loss_dur: 0.12099  (0.09902)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.83846  (12.64319)
     | > current_lr: 0.00017 
     | > step_time: 0.64260  (0.66932)
     | > loader_time: 0.41540  (0.41924)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.01001)
     | > avg_loss:[92m 0.38978 [0m(-0.03555)
     | > avg_log_mle:[91m -0.42312 [0m(+0.01177)
     | > avg_loss_dur:[92m 0.81290 [0m(-0.04733)


[4m[1m > EPOCH: 677/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:21:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 12200[0m
     | > loss: -0.43433  (-0.50461)
     | > log_mle: -0.56824  (-0.61651)
     | > loss_dur: 0.13391  (0.11190)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.45799  (12.14740)
     | > current_lr: 0.00017 
     | > step_time: 1.02690  (0.74732)
     | > loader_time: 0.60350  (0.47229)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00300)
     | > avg_loss:[92m 0.37888 [0m(-0.01090)
     | > avg_log_mle:[92m -0.42868 [0m(-0.00556)
     | > avg_loss_dur:[92m 0.80756 [0m(-0.00533)


[4m[1m > EPOCH: 678/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:21:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00701)
     | > avg_loss:[91m 0.40055 [0m(+0.02167)
     | > avg_log_mle:[91m -0.41799 [0m(+0.01069)
     | > avg_loss_dur:[91m 0.81854 [0m(+0.01098)


[4m[1m > EPOCH: 679/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:22:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 12225[0m
     | > loss: -0.57733  (-0.58371)
     | > log_mle: -0.66583  (-0.66893)
     | > loss_dur: 0.08850  (0.08523)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 23.69672  (18.38615)
     | > current_lr: 0.00017 
     | > step_time: 0.69660  (0.64058)
     | > loader_time: 0.46340  (0.42172)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00400)
     | > avg_loss:[91m 0.40300 [0m(+0.00246)
     | > avg_log_mle:[91m -0.41456 [0m(+0.00343)
     | > avg_loss_dur:[92m 0.81757 [0m(-0.00097)


[4m[1m > EPOCH: 680/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:22:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 12250[0m
     | > loss: -0.49611  (-0.54111)
     | > log_mle: -0.60707  (-0.64241)
     | > loss_dur: 0.11096  (0.10130)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.32071  (13.22405)
     | > current_lr: 0.00017 
     | > step_time: 0.71160  (0.69353)
     | > loader_time: 0.42940  (0.43189)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00000)
     | > avg_loss:[92m 0.38571 [0m(-0.01729)
     | > avg_log_mle:[92m -0.41657 [0m(-0.00200)
     | > avg_loss_dur:[92m 0.80228 [0m(-0.01529)


[4m[1m > EPOCH: 681/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:23:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 12275[0m
     | > loss: -0.43567  (-0.50029)
     | > log_mle: -0.56071  (-0.61392)
     | > loss_dur: 0.12504  (0.11363)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.87561  (16.22779)
     | > current_lr: 0.00017 
     | > step_time: 0.84880  (0.76988)
     | > loader_time: 0.40940  (0.48597)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00300)
     | > avg_loss:[91m 0.43539 [0m(+0.04968)
     | > avg_log_mle:[92m -0.42580 [0m(-0.00923)
     | > avg_loss_dur:[91m 0.86119 [0m(+0.05891)


[4m[1m > EPOCH: 682/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:23:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00701)
     | > avg_loss:[92m 0.35696 [0m(-0.07842)
     | > avg_log_mle:[91m -0.42337 [0m(+0.00243)
     | > avg_loss_dur:[92m 0.78033 [0m(-0.08085)


[4m[1m > EPOCH: 683/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:24:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 12300[0m
     | > loss: -0.50980  (-0.56192)
     | > log_mle: -0.61634  (-0.65328)
     | > loss_dur: 0.10653  (0.09136)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.48733  (11.96568)
     | > current_lr: 0.00017 
     | > step_time: 0.63960  (0.67011)
     | > loader_time: 0.39840  (0.41104)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01101)
     | > avg_loss:[91m 0.39982 [0m(+0.04286)
     | > avg_log_mle:[91m -0.42272 [0m(+0.00065)
     | > avg_loss_dur:[91m 0.82254 [0m(+0.04221)


[4m[1m > EPOCH: 684/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:24:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 12325[0m
     | > loss: -0.47066  (-0.53517)
     | > log_mle: -0.58314  (-0.63654)
     | > loss_dur: 0.11248  (0.10137)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.46218  (21.46412)
     | > current_lr: 0.00017 
     | > step_time: 0.79070  (0.72081)
     | > loader_time: 0.51350  (0.46966)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00100)
     | > avg_loss:[92m 0.39970 [0m(-0.00012)
     | > avg_log_mle:[91m -0.42035 [0m(+0.00237)
     | > avg_loss_dur:[92m 0.82005 [0m(-0.00249)


[4m[1m > EPOCH: 685/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:25:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[91m 0.40477 [0m(+0.00506)
     | > avg_log_mle:[92m -0.42087 [0m(-0.00052)
     | > avg_loss_dur:[91m 0.82564 [0m(+0.00559)


[4m[1m > EPOCH: 686/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:26:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 12350[0m
     | > loss: -0.58797  (-0.59132)
     | > log_mle: -0.67298  (-0.67475)
     | > loss_dur: 0.08501  (0.08343)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.16440  (12.01969)
     | > current_lr: 0.00017 
     | > step_time: 0.56850  (0.61806)
     | > loader_time: 0.39840  (0.39836)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00200)
     | > avg_loss:[91m 0.46366 [0m(+0.05889)
     | > avg_log_mle:[92m -0.42685 [0m(-0.00598)
     | > avg_loss_dur:[91m 0.89051 [0m(+0.06487)


[4m[1m > EPOCH: 687/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:26:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 12375[0m
     | > loss: -0.51113  (-0.53677)
     | > log_mle: -0.62664  (-0.64221)
     | > loss_dur: 0.11551  (0.10543)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.45348  (14.79782)
     | > current_lr: 0.00017 
     | > step_time: 0.87180  (0.68996)
     | > loader_time: 0.80570  (0.45085)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[92m 0.37044 [0m(-0.09322)
     | > avg_log_mle:[91m -0.41991 [0m(+0.00694)
     | > avg_loss_dur:[92m 0.79035 [0m(-0.10016)


[4m[1m > EPOCH: 688/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:27:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 12400[0m
     | > loss: -0.42979  (-0.50027)
     | > log_mle: -0.55905  (-0.61282)
     | > loss_dur: 0.12926  (0.11255)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.31381  (12.78545)
     | > current_lr: 0.00017 
     | > step_time: 0.94790  (0.76391)
     | > loader_time: 0.57450  (0.48112)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00901)
     | > avg_loss:[91m 0.46285 [0m(+0.09241)
     | > avg_log_mle:[92m -0.42958 [0m(-0.00967)
     | > avg_loss_dur:[91m 0.89243 [0m(+0.10208)


[4m[1m > EPOCH: 689/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:27:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00500)
     | > avg_loss:[92m 0.43573 [0m(-0.02712)
     | > avg_log_mle:[91m -0.41760 [0m(+0.01198)
     | > avg_loss_dur:[92m 0.85333 [0m(-0.03910)


[4m[1m > EPOCH: 690/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:28:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 12425[0m
     | > loss: -0.52047  (-0.57005)
     | > log_mle: -0.63189  (-0.66281)
     | > loss_dur: 0.11142  (0.09276)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.30442  (11.72520)
     | > current_lr: 0.00017 
     | > step_time: 0.74370  (0.67962)
     | > loader_time: 0.44540  (0.41278)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00701)
     | > avg_loss:[92m 0.38304 [0m(-0.05268)
     | > avg_log_mle:[91m -0.40547 [0m(+0.01213)
     | > avg_loss_dur:[92m 0.78851 [0m(-0.06481)


[4m[1m > EPOCH: 691/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:28:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 12450[0m
     | > loss: -0.46438  (-0.53550)
     | > log_mle: -0.58873  (-0.63596)
     | > loss_dur: 0.12435  (0.10046)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.26416  (14.76628)
     | > current_lr: 0.00017 
     | > step_time: 0.91080  (0.71573)
     | > loader_time: 0.64760  (0.45341)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[91m 0.40230 [0m(+0.01926)
     | > avg_log_mle:[92m -0.42648 [0m(-0.02101)
     | > avg_loss_dur:[91m 0.82879 [0m(+0.04027)


[4m[1m > EPOCH: 692/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:29:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00400)
     | > avg_loss:[91m 0.40471 [0m(+0.00241)
     | > avg_log_mle:[91m -0.42158 [0m(+0.00490)
     | > avg_loss_dur:[92m 0.82629 [0m(-0.00249)


[4m[1m > EPOCH: 693/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:29:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 12475[0m
     | > loss: -0.59778  (-0.59778)
     | > log_mle: -0.68218  (-0.68218)
     | > loss_dur: 0.08440  (0.08440)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.71086  (11.71086)
     | > current_lr: 0.00017 
     | > step_time: 0.64860  (0.64859)
     | > loader_time: 0.38030  (0.38035)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[91m 0.44120 [0m(+0.03649)
     | > avg_log_mle:[92m -0.42514 [0m(-0.00355)
     | > avg_loss_dur:[91m 0.86633 [0m(+0.04004)


[4m[1m > EPOCH: 694/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:30:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 12500[0m
     | > loss: -0.54886  (-0.56340)
     | > log_mle: -0.65225  (-0.65717)
     | > loss_dur: 0.10339  (0.09377)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.03802  (12.10110)
     | > current_lr: 0.00017 
     | > step_time: 0.69560  (0.67061)
     | > loader_time: 0.42840  (0.42276)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[92m 0.44034 [0m(-0.00086)
     | > avg_log_mle:[91m -0.41930 [0m(+0.00584)
     | > avg_loss_dur:[92m 0.85964 [0m(-0.00669)


[4m[1m > EPOCH: 695/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:30:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 12525[0m
     | > loss: -0.42826  (-0.50948)
     | > log_mle: -0.55463  (-0.61964)
     | > loss_dur: 0.12637  (0.11016)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 27.60855  (15.64353)
     | > current_lr: 0.00017 
     | > step_time: 0.88080  (0.75168)
     | > loader_time: 0.53950  (0.47076)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[91m 0.46124 [0m(+0.02090)
     | > avg_log_mle:[92m -0.42089 [0m(-0.00160)
     | > avg_loss_dur:[91m 0.88214 [0m(+0.02250)


[4m[1m > EPOCH: 696/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:31:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[92m 0.43794 [0m(-0.02330)
     | > avg_log_mle:[91m -0.42081 [0m(+0.00008)
     | > avg_loss_dur:[92m 0.85875 [0m(-0.02339)


[4m[1m > EPOCH: 697/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:31:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 12550[0m
     | > loss: -0.54926  (-0.57172)
     | > log_mle: -0.65088  (-0.66195)
     | > loss_dur: 0.10162  (0.09023)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.87774  (19.37980)
     | > current_lr: 0.00017 
     | > step_time: 0.73170  (0.66260)
     | > loader_time: 0.50450  (0.42814)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00300)
     | > avg_loss:[92m 0.40259 [0m(-0.03535)
     | > avg_log_mle:[92m -0.42390 [0m(-0.00309)
     | > avg_loss_dur:[92m 0.82649 [0m(-0.03226)


[4m[1m > EPOCH: 698/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:32:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 12575[0m
     | > loss: -0.49201  (-0.54286)
     | > log_mle: -0.60414  (-0.64115)
     | > loss_dur: 0.11213  (0.09829)
     | > amp_scaler: 16384.00000  (8936.72727)
     | > grad_norm: 20.04655  (21.07131)
     | > current_lr: 0.00017 
     | > step_time: 0.73870  (0.69700)
     | > loader_time: 0.50050  (0.46797)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00200)
     | > avg_loss:[91m 0.42175 [0m(+0.01916)
     | > avg_log_mle:[91m -0.41851 [0m(+0.00539)
     | > avg_loss_dur:[91m 0.84026 [0m(+0.01377)


[4m[1m > EPOCH: 699/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:32:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00000)
     | > avg_loss:[92m 0.37875 [0m(-0.04300)
     | > avg_log_mle:[91m -0.41739 [0m(+0.00112)
     | > avg_loss_dur:[92m 0.79614 [0m(-0.04412)


[4m[1m > EPOCH: 700/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:33:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 12600[0m
     | > loss: -0.60255  (-0.60255)
     | > log_mle: -0.68466  (-0.68466)
     | > loss_dur: 0.08211  (0.08211)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.21678  (11.21678)
     | > current_lr: 0.00017 
     | > step_time: 0.60250  (0.60255)
     | > loader_time: 0.28520  (0.28525)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00500)
     | > avg_loss:[91m 0.39964 [0m(+0.02090)
     | > avg_log_mle:[92m -0.41769 [0m(-0.00030)
     | > avg_loss_dur:[91m 0.81733 [0m(+0.02119)


[4m[1m > EPOCH: 701/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:33:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 12625[0m
     | > loss: -0.53006  (-0.55186)
     | > log_mle: -0.63679  (-0.65167)
     | > loss_dur: 0.10674  (0.09981)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.18425  (14.46443)
     | > current_lr: 0.00018 
     | > step_time: 0.65960  (0.67133)
     | > loader_time: 0.40040  (0.40909)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00801)
     | > avg_loss:[92m 0.38658 [0m(-0.01307)
     | > avg_log_mle:[92m -0.42399 [0m(-0.00631)
     | > avg_loss_dur:[92m 0.81057 [0m(-0.00676)


[4m[1m > EPOCH: 702/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:34:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 12650[0m
     | > loss: -0.43589  (-0.52415)
     | > log_mle: -0.56966  (-0.63299)
     | > loss_dur: 0.13377  (0.10884)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.28110  (9.13994)
     | > current_lr: 0.00018 
     | > step_time: 1.01890  (0.73996)
     | > loader_time: 0.62160  (0.48058)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.47372 [0m(+0.08714)
     | > avg_log_mle:[91m -0.40283 [0m(+0.02116)
     | > avg_loss_dur:[91m 0.87655 [0m(+0.06598)


[4m[1m > EPOCH: 703/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:34:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00100)
     | > avg_loss:[92m 0.38024 [0m(-0.09347)
     | > avg_log_mle:[92m -0.41979 [0m(-0.01696)
     | > avg_loss_dur:[92m 0.80003 [0m(-0.07651)


[4m[1m > EPOCH: 704/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:35:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 12675[0m
     | > loss: -0.57518  (-0.58924)
     | > log_mle: -0.66724  (-0.67613)
     | > loss_dur: 0.09207  (0.08689)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.33402  (10.09118)
     | > current_lr: 0.00018 
     | > step_time: 0.68460  (0.63324)
     | > loader_time: 0.43440  (0.39169)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[91m 0.38350 [0m(+0.00325)
     | > avg_log_mle:[91m -0.41521 [0m(+0.00458)
     | > avg_loss_dur:[92m 0.79871 [0m(-0.00133)


[4m[1m > EPOCH: 705/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:35:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 12700[0m
     | > loss: -0.50707  (-0.55482)
     | > log_mle: -0.61459  (-0.65163)
     | > loss_dur: 0.10752  (0.09682)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.99247  (14.83488)
     | > current_lr: 0.00018 
     | > step_time: 0.70260  (0.69542)
     | > loader_time: 0.48840  (0.43750)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00200)
     | > avg_loss:[91m 0.42286 [0m(+0.03937)
     | > avg_log_mle:[92m -0.41666 [0m(-0.00144)
     | > avg_loss_dur:[91m 0.83952 [0m(+0.04081)


[4m[1m > EPOCH: 706/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:36:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 12725[0m
     | > loss: -0.46656  (-0.51795)
     | > log_mle: -0.57490  (-0.62259)
     | > loss_dur: 0.10834  (0.10464)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 21.45542  (13.11261)
     | > current_lr: 0.00018 
     | > step_time: 0.84480  (0.76764)
     | > loader_time: 0.42240  (0.48309)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00100)
     | > avg_loss:[92m 0.40484 [0m(-0.01802)
     | > avg_log_mle:[91m -0.41226 [0m(+0.00440)
     | > avg_loss_dur:[92m 0.81710 [0m(-0.02242)


[4m[1m > EPOCH: 707/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:36:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00000)
     | > avg_loss:[91m 0.41304 [0m(+0.00820)
     | > avg_log_mle:[92m -0.41238 [0m(-0.00012)
     | > avg_loss_dur:[91m 0.82542 [0m(+0.00832)


[4m[1m > EPOCH: 708/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:37:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 12750[0m
     | > loss: -0.52001  (-0.57401)
     | > log_mle: -0.62918  (-0.66374)
     | > loss_dur: 0.10917  (0.08973)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.62494  (14.86830)
     | > current_lr: 0.00018 
     | > step_time: 0.63760  (0.67111)
     | > loader_time: 0.41040  (0.41638)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[91m 0.42582 [0m(+0.01278)
     | > avg_log_mle:[92m -0.42088 [0m(-0.00850)
     | > avg_loss_dur:[91m 0.84670 [0m(+0.02128)


[4m[1m > EPOCH: 709/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:38:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 12775[0m
     | > loss: -0.44849  (-0.54252)
     | > log_mle: -0.58091  (-0.64400)
     | > loss_dur: 0.13242  (0.10148)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 33.88670  (13.44251)
     | > current_lr: 0.00018 
     | > step_time: 0.79270  (0.72089)
     | > loader_time: 0.48040  (0.48482)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[91m 0.42904 [0m(+0.00322)
     | > avg_log_mle:[91m -0.41492 [0m(+0.00596)
     | > avg_loss_dur:[92m 0.84396 [0m(-0.00274)


[4m[1m > EPOCH: 710/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:38:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00500)
     | > avg_loss:[91m 0.44486 [0m(+0.01582)
     | > avg_log_mle:[91m -0.41325 [0m(+0.00166)
     | > avg_loss_dur:[91m 0.85812 [0m(+0.01416)


[4m[1m > EPOCH: 711/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:39:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 12800[0m
     | > loss: -0.60090  (-0.60133)
     | > log_mle: -0.68137  (-0.68220)
     | > loss_dur: 0.08048  (0.08087)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 15.97673  (11.42353)
     | > current_lr: 0.00018 
     | > step_time: 0.56250  (0.60455)
     | > loader_time: 0.37330  (0.37134)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00501)
     | > avg_loss:[92m 0.41667 [0m(-0.02819)
     | > avg_log_mle:[91m -0.41039 [0m(+0.00287)
     | > avg_loss_dur:[92m 0.82706 [0m(-0.03106)


[4m[1m > EPOCH: 712/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:39:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 12825[0m
     | > loss: -0.52197  (-0.54961)
     | > log_mle: -0.63976  (-0.64982)
     | > loss_dur: 0.11779  (0.10021)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.89588  (10.07300)
     | > current_lr: 0.00018 
     | > step_time: 0.87680  (0.69419)
     | > loader_time: 0.59850  (0.44507)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00400)
     | > avg_loss:[91m 0.42190 [0m(+0.00523)
     | > avg_log_mle:[92m -0.41227 [0m(-0.00188)
     | > avg_loss_dur:[91m 0.83417 [0m(+0.00711)


[4m[1m > EPOCH: 713/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:40:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 12850[0m
     | > loss: -0.45260  (-0.51329)
     | > log_mle: -0.57234  (-0.62445)
     | > loss_dur: 0.11974  (0.11115)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.38482  (13.42871)
     | > current_lr: 0.00018 
     | > step_time: 0.95090  (0.76213)
     | > loader_time: 0.61660  (0.48475)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00801)
     | > avg_loss:[92m 0.41095 [0m(-0.01096)
     | > avg_log_mle:[92m -0.41989 [0m(-0.00762)
     | > avg_loss_dur:[92m 0.83084 [0m(-0.00334)


[4m[1m > EPOCH: 714/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:40:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00000)
     | > avg_loss:[91m 0.42752 [0m(+0.01658)
     | > avg_log_mle:[91m -0.40958 [0m(+0.01032)
     | > avg_loss_dur:[91m 0.83710 [0m(+0.00626)


[4m[1m > EPOCH: 715/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:41:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 12875[0m
     | > loss: -0.52809  (-0.57088)
     | > log_mle: -0.63935  (-0.66663)
     | > loss_dur: 0.11126  (0.09575)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.76365  (11.76371)
     | > current_lr: 0.00018 
     | > step_time: 0.74170  (0.67341)
     | > loader_time: 0.47040  (0.41318)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[91m 0.45321 [0m(+0.02568)
     | > avg_log_mle:[91m -0.40363 [0m(+0.00594)
     | > avg_loss_dur:[91m 0.85684 [0m(+0.01974)


[4m[1m > EPOCH: 716/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:41:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 12900[0m
     | > loss: -0.48887  (-0.54600)
     | > log_mle: -0.60981  (-0.64954)
     | > loss_dur: 0.12094  (0.10354)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.13235  (14.25531)
     | > current_lr: 0.00018 
     | > step_time: 0.91080  (0.71523)
     | > loader_time: 0.63360  (0.46303)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00400)
     | > avg_loss:[91m 0.47976 [0m(+0.02655)
     | > avg_log_mle:[92m -0.40501 [0m(-0.00138)
     | > avg_loss_dur:[91m 0.88477 [0m(+0.02793)


[4m[1m > EPOCH: 717/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:42:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00100)
     | > avg_loss:[92m 0.41785 [0m(-0.06190)
     | > avg_log_mle:[91m -0.40012 [0m(+0.00489)
     | > avg_loss_dur:[92m 0.81798 [0m(-0.06679)


[4m[1m > EPOCH: 718/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:42:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 12925[0m
     | > loss: -0.62116  (-0.62116)
     | > log_mle: -0.69945  (-0.69945)
     | > loss_dur: 0.07829  (0.07829)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.22881  (8.22881)
     | > current_lr: 0.00018 
     | > step_time: 0.64860  (0.64859)
     | > loader_time: 0.40040  (0.40036)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[92m 0.41574 [0m(-0.00212)
     | > avg_log_mle:[92m -0.40971 [0m(-0.00959)
     | > avg_loss_dur:[91m 0.82545 [0m(+0.00747)


[4m[1m > EPOCH: 719/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:43:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 12950[0m
     | > loss: -0.53126  (-0.55737)
     | > log_mle: -0.64286  (-0.65713)
     | > loss_dur: 0.11160  (0.09976)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.38031  (20.91577)
     | > current_lr: 0.00018 
     | > step_time: 0.68660  (0.66923)
     | > loader_time: 0.41540  (0.40637)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00300)
     | > avg_loss:[91m 0.46020 [0m(+0.04446)
     | > avg_log_mle:[92m -0.41154 [0m(-0.00182)
     | > avg_loss_dur:[91m 0.87173 [0m(+0.04628)


[4m[1m > EPOCH: 720/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:43:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 12975[0m
     | > loss: -0.46564  (-0.52932)
     | > log_mle: -0.58066  (-0.63284)
     | > loss_dur: 0.11501  (0.10351)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.75991  (17.71226)
     | > current_lr: 0.00018 
     | > step_time: 0.87580  (0.75195)
     | > loader_time: 0.55250  (0.46422)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01001)
     | > avg_loss:[92m 0.42570 [0m(-0.03449)
     | > avg_log_mle:[91m -0.39156 [0m(+0.01998)
     | > avg_loss_dur:[92m 0.81726 [0m(-0.05447)


[4m[1m > EPOCH: 721/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:44:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.01001)
     | > avg_loss:[92m 0.41423 [0m(-0.01147)
     | > avg_log_mle:[92m -0.39810 [0m(-0.00654)
     | > avg_loss_dur:[92m 0.81234 [0m(-0.00493)


[4m[1m > EPOCH: 722/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:44:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 13000[0m
     | > loss: -0.55942  (-0.59271)
     | > log_mle: -0.65345  (-0.67640)
     | > loss_dur: 0.09403  (0.08369)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.37239  (25.12383)
     | > current_lr: 0.00018 
     | > step_time: 0.73170  (0.66160)
     | > loader_time: 0.50350  (0.41287)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00400)
     | > avg_loss:[91m 0.42863 [0m(+0.01440)
     | > avg_log_mle:[92m -0.40996 [0m(-0.01185)
     | > avg_loss_dur:[91m 0.83859 [0m(+0.02625)


[4m[1m > EPOCH: 723/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:45:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 13025[0m
     | > loss: -0.52365  (-0.55871)
     | > log_mle: -0.62943  (-0.65665)
     | > loss_dur: 0.10578  (0.09794)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.88938  (18.56227)
     | > current_lr: 0.00018 
     | > step_time: 0.74570  (0.69982)
     | > loader_time: 0.47140  (0.43203)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00200)
     | > avg_loss:[91m 0.46636 [0m(+0.03772)
     | > avg_log_mle:[91m -0.40459 [0m(+0.00536)
     | > avg_loss_dur:[91m 0.87095 [0m(+0.03236)


[4m[1m > EPOCH: 724/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:45:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00601)
     | > avg_loss:[91m 0.48824 [0m(+0.02188)
     | > avg_log_mle:[91m -0.39923 [0m(+0.00536)
     | > avg_loss_dur:[91m 0.88747 [0m(+0.01652)


[4m[1m > EPOCH: 725/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:46:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 13050[0m
     | > loss: -0.60825  (-0.60825)
     | > log_mle: -0.69362  (-0.69362)
     | > loss_dur: 0.08537  (0.08537)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.28543  (14.28543)
     | > current_lr: 0.00018 
     | > step_time: 0.50150  (0.50146)
     | > loader_time: 0.26620  (0.26624)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06606 [0m(+0.00100)
     | > avg_loss:[92m 0.42175 [0m(-0.06649)
     | > avg_log_mle:[92m -0.40789 [0m(-0.00866)
     | > avg_loss_dur:[92m 0.82964 [0m(-0.05783)


[4m[1m > EPOCH: 726/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:46:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 13075[0m
     | > loss: -0.54057  (-0.57819)
     | > log_mle: -0.64718  (-0.67315)
     | > loss_dur: 0.10662  (0.09496)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.44701  (18.42024)
     | > current_lr: 0.00018 
     | > step_time: 0.64660  (0.66661)
     | > loader_time: 0.40840  (0.41738)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[92m 0.41480 [0m(-0.00695)
     | > avg_log_mle:[92m -0.40878 [0m(-0.00089)
     | > avg_loss_dur:[92m 0.82358 [0m(-0.00606)


[4m[1m > EPOCH: 727/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:47:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 13100[0m
     | > loss: -0.44617  (-0.54558)
     | > log_mle: -0.56962  (-0.64613)
     | > loss_dur: 0.12345  (0.10054)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.84463  (14.65714)
     | > current_lr: 0.00018 
     | > step_time: 1.01990  (0.74269)
     | > loader_time: 0.62660  (0.46293)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[91m 0.43339 [0m(+0.01859)
     | > avg_log_mle:[91m -0.39806 [0m(+0.01072)
     | > avg_loss_dur:[91m 0.83146 [0m(+0.00788)


[4m[1m > EPOCH: 728/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:47:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00400)
     | > avg_loss:[92m 0.38465 [0m(-0.04874)
     | > avg_log_mle:[92m -0.41165 [0m(-0.01359)
     | > avg_loss_dur:[92m 0.79630 [0m(-0.03516)


[4m[1m > EPOCH: 729/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:48:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 13125[0m
     | > loss: -0.61157  (-0.62826)
     | > log_mle: -0.69819  (-0.70487)
     | > loss_dur: 0.08662  (0.07660)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.84377  (15.39142)
     | > current_lr: 0.00018 
     | > step_time: 0.68960  (0.63558)
     | > loader_time: 0.38430  (0.36533)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00100)
     | > avg_loss:[91m 0.45145 [0m(+0.06679)
     | > avg_log_mle:[91m -0.40227 [0m(+0.00938)
     | > avg_loss_dur:[91m 0.85372 [0m(+0.05741)


[4m[1m > EPOCH: 730/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:48:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 13150[0m
     | > loss: -0.51731  (-0.57141)
     | > log_mle: -0.62143  (-0.66387)
     | > loss_dur: 0.10412  (0.09246)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.68438  (13.89767)
     | > current_lr: 0.00018 
     | > step_time: 0.69860  (0.69233)
     | > loader_time: 0.46640  (0.42659)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00701)
     | > avg_loss:[91m 0.48278 [0m(+0.03134)
     | > avg_log_mle:[91m -0.40099 [0m(+0.00128)
     | > avg_loss_dur:[91m 0.88377 [0m(+0.03006)


[4m[1m > EPOCH: 731/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:49:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 13175[0m
     | > loss: -0.47826  (-0.53392)
     | > log_mle: -0.58624  (-0.63648)
     | > loss_dur: 0.10797  (0.10256)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.88836  (23.03845)
     | > current_lr: 0.00018 
     | > step_time: 0.85080  (0.76805)
     | > loader_time: 0.40740  (0.49910)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00000)
     | > avg_loss:[92m 0.42053 [0m(-0.06226)
     | > avg_log_mle:[91m -0.39815 [0m(+0.00284)
     | > avg_loss_dur:[92m 0.81868 [0m(-0.06510)


[4m[1m > EPOCH: 732/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:50:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[91m 0.43969 [0m(+0.01917)
     | > avg_log_mle:[92m -0.40462 [0m(-0.00647)
     | > avg_loss_dur:[91m 0.84431 [0m(+0.02563)


[4m[1m > EPOCH: 733/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:50:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 13200[0m
     | > loss: -0.52808  (-0.58196)
     | > log_mle: -0.63268  (-0.67240)
     | > loss_dur: 0.10460  (0.09044)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 27.99191  (21.08939)
     | > current_lr: 0.00018 
     | > step_time: 0.63860  (0.66694)
     | > loader_time: 0.38430  (0.40453)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[92m 0.35759 [0m(-0.08210)
     | > avg_log_mle:[92m -0.40486 [0m(-0.00024)
     | > avg_loss_dur:[92m 0.76245 [0m(-0.08186)


[4m[1m > EPOCH: 734/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:51:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 13225[0m
     | > loss: -0.49183  (-0.55140)
     | > log_mle: -0.60189  (-0.65098)
     | > loss_dur: 0.11005  (0.09957)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.04056  (11.92442)
     | > current_lr: 0.00018 
     | > step_time: 0.79170  (0.72143)
     | > loader_time: 0.49440  (0.44887)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00100)
     | > avg_loss:[91m 0.39885 [0m(+0.04126)
     | > avg_log_mle:[91m -0.39701 [0m(+0.00785)
     | > avg_loss_dur:[91m 0.79587 [0m(+0.03341)


[4m[1m > EPOCH: 735/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:51:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00601)
     | > avg_loss:[91m 0.48708 [0m(+0.08823)
     | > avg_log_mle:[91m -0.39250 [0m(+0.00451)
     | > avg_loss_dur:[91m 0.87958 [0m(+0.08372)


[4m[1m > EPOCH: 736/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:52:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 13250[0m
     | > loss: -0.60325  (-0.61449)
     | > log_mle: -0.69142  (-0.69823)
     | > loss_dur: 0.08817  (0.08374)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.87096  (10.90272)
     | > current_lr: 0.00018 
     | > step_time: 0.55950  (0.60655)
     | > loader_time: 0.31830  (0.35132)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01101)
     | > avg_loss:[91m 0.50078 [0m(+0.01370)
     | > avg_log_mle:[91m -0.38861 [0m(+0.00389)
     | > avg_loss_dur:[91m 0.88939 [0m(+0.00981)


[4m[1m > EPOCH: 737/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:52:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 13275[0m
     | > loss: -0.53120  (-0.55775)
     | > log_mle: -0.63701  (-0.65838)
     | > loss_dur: 0.10581  (0.10064)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.17322  (11.80647)
     | > current_lr: 0.00018 
     | > step_time: 0.87280  (0.69107)
     | > loader_time: 0.57250  (0.44596)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00801)
     | > avg_loss:[92m 0.49961 [0m(-0.00117)
     | > avg_log_mle:[92m -0.40059 [0m(-0.01198)
     | > avg_loss_dur:[91m 0.90020 [0m(+0.01081)


[4m[1m > EPOCH: 738/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:53:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 13300[0m
     | > loss: -0.45945  (-0.53211)
     | > log_mle: -0.57396  (-0.63651)
     | > loss_dur: 0.11451  (0.10441)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.48580  (15.28858)
     | > current_lr: 0.00018 
     | > step_time: 0.96590  (0.76438)
     | > loader_time: 0.56350  (0.48957)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00300)
     | > avg_loss:[92m 0.47197 [0m(-0.02764)
     | > avg_log_mle:[91m -0.39748 [0m(+0.00311)
     | > avg_loss_dur:[92m 0.86945 [0m(-0.03075)


[4m[1m > EPOCH: 739/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:53:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00701)
     | > avg_loss:[92m 0.44649 [0m(-0.02548)
     | > avg_log_mle:[92m -0.39930 [0m(-0.00182)
     | > avg_loss_dur:[92m 0.84579 [0m(-0.02366)


[4m[1m > EPOCH: 740/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:54:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 13325[0m
     | > loss: -0.53930  (-0.59467)
     | > log_mle: -0.64467  (-0.68430)
     | > loss_dur: 0.10537  (0.08963)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 32.25629  (19.32673)
     | > current_lr: 0.00018 
     | > step_time: 0.74170  (0.67421)
     | > loader_time: 0.45440  (0.42178)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[91m 0.47193 [0m(+0.02543)
     | > avg_log_mle:[91m -0.38991 [0m(+0.00938)
     | > avg_loss_dur:[91m 0.86184 [0m(+0.01605)


[4m[1m > EPOCH: 741/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:54:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 13350[0m
     | > loss: -0.50038  (-0.55060)
     | > log_mle: -0.61766  (-0.65350)
     | > loss_dur: 0.11728  (0.10290)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.24452  (13.90818)
     | > current_lr: 0.00019 
     | > step_time: 0.91180  (0.71432)
     | > loader_time: 0.61360  (0.45041)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00000)
     | > avg_loss:[92m 0.44791 [0m(-0.02402)
     | > avg_log_mle:[92m -0.40129 [0m(-0.01138)
     | > avg_loss_dur:[92m 0.84920 [0m(-0.01264)


[4m[1m > EPOCH: 742/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:55:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00100)
     | > avg_loss:[92m 0.38481 [0m(-0.06310)
     | > avg_log_mle:[91m -0.38202 [0m(+0.01927)
     | > avg_loss_dur:[92m 0.76683 [0m(-0.08237)


[4m[1m > EPOCH: 743/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:55:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 13375[0m
     | > loss: -0.63358  (-0.63358)
     | > log_mle: -0.71224  (-0.71224)
     | > loss_dur: 0.07865  (0.07865)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.89097  (7.89097)
     | > current_lr: 0.00019 
     | > step_time: 0.65460  (0.65460)
     | > loader_time: 0.36730  (0.36733)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00100)
     | > avg_loss:[91m 0.44580 [0m(+0.06099)
     | > avg_log_mle:[92m -0.40332 [0m(-0.02129)
     | > avg_loss_dur:[91m 0.84911 [0m(+0.08228)


[4m[1m > EPOCH: 744/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:56:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 13400[0m
     | > loss: -0.53080  (-0.57772)
     | > log_mle: -0.64176  (-0.67086)
     | > loss_dur: 0.11096  (0.09314)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.21229  (6.51620)
     | > current_lr: 0.00019 
     | > step_time: 0.68260  (0.66511)
     | > loader_time: 0.41540  (0.42789)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.06906 [0m(+0.00000)
     | > avg_loss:[91m 0.46874 [0m(+0.02294)
     | > avg_log_mle:[91m -0.38862 [0m(+0.01470)
     | > avg_loss_dur:[91m 0.85736 [0m(+0.00825)


[4m[1m > EPOCH: 745/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:56:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 13425[0m
     | > loss: -0.48030  (-0.53701)
     | > log_mle: -0.59632  (-0.64197)
     | > loss_dur: 0.11602  (0.10496)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.27851  (20.24664)
     | > current_lr: 0.00019 
     | > step_time: 0.88080  (0.75222)
     | > loader_time: 0.57850  (0.47543)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00200)
     | > avg_loss:[92m 0.46743 [0m(-0.00131)
     | > avg_log_mle:[92m -0.40445 [0m(-0.01583)
     | > avg_loss_dur:[91m 0.87188 [0m(+0.01452)


[4m[1m > EPOCH: 746/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:57:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[92m 0.46149 [0m(-0.00594)
     | > avg_log_mle:[91m -0.37918 [0m(+0.02527)
     | > avg_loss_dur:[92m 0.84067 [0m(-0.03121)


[4m[1m > EPOCH: 747/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:57:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 13450[0m
     | > loss: -0.59147  (-0.60983)
     | > log_mle: -0.67705  (-0.69060)
     | > loss_dur: 0.08558  (0.08077)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.08936  (25.97325)
     | > current_lr: 0.00019 
     | > step_time: 0.73170  (0.65910)
     | > loader_time: 0.52150  (0.40637)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00300)
     | > avg_loss:[92m 0.42289 [0m(-0.03860)
     | > avg_log_mle:[92m -0.40211 [0m(-0.02293)
     | > avg_loss_dur:[92m 0.82500 [0m(-0.01568)


[4m[1m > EPOCH: 748/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:58:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 13475[0m
     | > loss: -0.54085  (-0.58657)
     | > log_mle: -0.63516  (-0.67544)
     | > loss_dur: 0.09431  (0.08887)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 28.65506  (14.98022)
     | > current_lr: 0.00019 
     | > step_time: 0.74170  (0.69709)
     | > loader_time: 0.48340  (0.44531)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[91m 0.43906 [0m(+0.01617)
     | > avg_log_mle:[91m -0.38921 [0m(+0.01290)
     | > avg_loss_dur:[91m 0.82827 [0m(+0.00327)


[4m[1m > EPOCH: 749/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:58:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00000)
     | > avg_loss:[92m 0.39729 [0m(-0.04177)
     | > avg_log_mle:[92m -0.39836 [0m(-0.00916)
     | > avg_loss_dur:[92m 0.79566 [0m(-0.03261)


[4m[1m > EPOCH: 750/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:59:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 13500[0m
     | > loss: -0.64684  (-0.64684)
     | > log_mle: -0.72681  (-0.72681)
     | > loss_dur: 0.07997  (0.07997)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.01335  (9.01335)
     | > current_lr: 0.00019 
     | > step_time: 0.68160  (0.68162)
     | > loader_time: 0.27820  (0.27824)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[91m 0.43940 [0m(+0.04211)
     | > avg_log_mle:[91m -0.38021 [0m(+0.01815)
     | > avg_loss_dur:[91m 0.81961 [0m(+0.02396)


[4m[1m > EPOCH: 751/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 12:59:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 13525[0m
     | > loss: -0.56043  (-0.60591)
     | > log_mle: -0.66105  (-0.69100)
     | > loss_dur: 0.10062  (0.08509)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.12750  (16.78962)
     | > current_lr: 0.00019 
     | > step_time: 0.65460  (0.66746)
     | > loader_time: 0.43640  (0.41609)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00000)
     | > avg_loss:[91m 0.45830 [0m(+0.01890)
     | > avg_log_mle:[92m -0.39324 [0m(-0.01303)
     | > avg_loss_dur:[91m 0.85154 [0m(+0.03193)


[4m[1m > EPOCH: 752/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:00:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 13550[0m
     | > loss: -0.49360  (-0.55706)
     | > log_mle: -0.60418  (-0.65429)
     | > loss_dur: 0.11058  (0.09723)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.74504  (10.83766)
     | > current_lr: 0.00019 
     | > step_time: 1.02090  (0.74239)
     | > loader_time: 0.62860  (0.47400)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[92m 0.45118 [0m(-0.00712)
     | > avg_log_mle:[91m -0.39312 [0m(+0.00012)
     | > avg_loss_dur:[92m 0.84430 [0m(-0.00724)


[4m[1m > EPOCH: 753/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:00:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[92m 0.40877 [0m(-0.04241)
     | > avg_log_mle:[91m -0.39245 [0m(+0.00066)
     | > avg_loss_dur:[92m 0.80123 [0m(-0.04307)


[4m[1m > EPOCH: 754/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:01:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 13575[0m
     | > loss: -0.63784  (-0.63906)
     | > log_mle: -0.71730  (-0.71553)
     | > loss_dur: 0.07946  (0.07647)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.29755  (13.72619)
     | > current_lr: 0.00019 
     | > step_time: 0.68760  (0.63458)
     | > loader_time: 0.41240  (0.38001)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00801)
     | > avg_loss:[92m 0.39231 [0m(-0.01646)
     | > avg_log_mle:[91m -0.38912 [0m(+0.00333)
     | > avg_loss_dur:[92m 0.78143 [0m(-0.01979)


[4m[1m > EPOCH: 755/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:02:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 13600[0m
     | > loss: -0.54531  (-0.58896)
     | > log_mle: -0.63979  (-0.67844)
     | > loss_dur: 0.09448  (0.08948)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.58504  (11.82837)
     | > current_lr: 0.00019 
     | > step_time: 0.70060  (0.69153)
     | > loader_time: 0.42640  (0.43169)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08207 [0m(+0.00600)
     | > avg_loss:[91m 0.42153 [0m(+0.02922)
     | > avg_log_mle:[91m -0.38236 [0m(+0.00676)
     | > avg_loss_dur:[91m 0.80389 [0m(+0.02246)


[4m[1m > EPOCH: 756/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:02:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 13625[0m
     | > loss: -0.46998  (-0.54930)
     | > log_mle: -0.58287  (-0.64780)
     | > loss_dur: 0.11289  (0.09850)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 51.95552  (12.39474)
     | > current_lr: 0.00019 
     | > step_time: 0.85280  (0.76693)
     | > loader_time: 0.44640  (0.46801)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.01301)
     | > avg_loss:[91m 0.43008 [0m(+0.00855)
     | > avg_log_mle:[91m -0.38054 [0m(+0.00182)
     | > avg_loss_dur:[91m 0.81062 [0m(+0.00673)


[4m[1m > EPOCH: 757/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:03:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00000)
     | > avg_loss:[92m 0.38375 [0m(-0.04633)
     | > avg_log_mle:[92m -0.39759 [0m(-0.01704)
     | > avg_loss_dur:[92m 0.78133 [0m(-0.02929)


[4m[1m > EPOCH: 758/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:03:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 13650[0m
     | > loss: -0.56361  (-0.61038)
     | > log_mle: -0.65314  (-0.69422)
     | > loss_dur: 0.08953  (0.08384)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.74413  (17.62333)
     | > current_lr: 0.00019 
     | > step_time: 0.63960  (0.66978)
     | > loader_time: 0.37430  (0.41421)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.06906 [0m(+0.00000)
     | > avg_loss:[91m 0.43746 [0m(+0.05372)
     | > avg_log_mle:[91m -0.38093 [0m(+0.01666)
     | > avg_loss_dur:[91m 0.81839 [0m(+0.03706)


[4m[1m > EPOCH: 759/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:04:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 13675[0m
     | > loss: -0.49546  (-0.58102)
     | > log_mle: -0.60504  (-0.67161)
     | > loss_dur: 0.10958  (0.09059)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.74392  (11.94647)
     | > current_lr: 0.00019 
     | > step_time: 0.78370  (0.71865)
     | > loader_time: 0.51550  (0.48613)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00500)
     | > avg_loss:[92m 0.43365 [0m(-0.00382)
     | > avg_log_mle:[92m -0.39845 [0m(-0.01752)
     | > avg_loss_dur:[91m 0.83210 [0m(+0.01370)


[4m[1m > EPOCH: 760/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:04:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00601)
     | > avg_loss:[91m 0.45387 [0m(+0.02022)
     | > avg_log_mle:[91m -0.39512 [0m(+0.00333)
     | > avg_loss_dur:[91m 0.84898 [0m(+0.01688)


[4m[1m > EPOCH: 761/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:05:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 13700[0m
     | > loss: -0.64272  (-0.64729)
     | > log_mle: -0.71720  (-0.72360)
     | > loss_dur: 0.07447  (0.07631)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.12486  (6.32839)
     | > current_lr: 0.00019 
     | > step_time: 0.56550  (0.60355)
     | > loader_time: 0.34830  (0.36133)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[92m 0.43186 [0m(-0.02201)
     | > avg_log_mle:[91m -0.39210 [0m(+0.00302)
     | > avg_loss_dur:[92m 0.82395 [0m(-0.02503)


[4m[1m > EPOCH: 762/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:05:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 13725[0m
     | > loss: -0.56757  (-0.58142)
     | > log_mle: -0.67296  (-0.67874)
     | > loss_dur: 0.10539  (0.09733)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.23645  (12.20556)
     | > current_lr: 0.00019 
     | > step_time: 0.87780  (0.69219)
     | > loader_time: 0.60860  (0.43595)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00500)
     | > avg_loss:[91m 0.49132 [0m(+0.05946)
     | > avg_log_mle:[91m -0.37768 [0m(+0.01442)
     | > avg_loss_dur:[91m 0.86900 [0m(+0.04504)


[4m[1m > EPOCH: 763/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:06:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 13750[0m
     | > loss: -0.49392  (-0.54131)
     | > log_mle: -0.60075  (-0.64821)
     | > loss_dur: 0.10683  (0.10689)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.29704  (17.09158)
     | > current_lr: 0.00019 
     | > step_time: 0.95190  (0.76276)
     | > loader_time: 0.60750  (0.49176)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00901)
     | > avg_loss:[92m 0.38646 [0m(-0.10486)
     | > avg_log_mle:[92m -0.39566 [0m(-0.01798)
     | > avg_loss_dur:[92m 0.78212 [0m(-0.08687)


[4m[1m > EPOCH: 764/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:06:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00000)
     | > avg_loss:[91m 0.41514 [0m(+0.02868)
     | > avg_log_mle:[91m -0.38095 [0m(+0.01471)
     | > avg_loss_dur:[91m 0.79609 [0m(+0.01397)


[4m[1m > EPOCH: 765/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:07:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 13775[0m
     | > loss: -0.55230  (-0.60410)
     | > log_mle: -0.64986  (-0.68863)
     | > loss_dur: 0.09756  (0.08453)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.85035  (11.01158)
     | > current_lr: 0.00019 
     | > step_time: 0.74970  (0.67582)
     | > loader_time: 0.43140  (0.41438)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00200)
     | > avg_loss:[91m 0.44206 [0m(+0.02692)
     | > avg_log_mle:[91m -0.38008 [0m(+0.00087)
     | > avg_loss_dur:[91m 0.82214 [0m(+0.02605)


[4m[1m > EPOCH: 766/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:07:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 13800[0m
     | > loss: -0.51072  (-0.56728)
     | > log_mle: -0.62240  (-0.66714)
     | > loss_dur: 0.11168  (0.09986)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.82747  (16.56776)
     | > current_lr: 0.00019 
     | > step_time: 0.92290  (0.71665)
     | > loader_time: 0.64960  (0.45533)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00500)
     | > avg_loss:[91m 0.47935 [0m(+0.03729)
     | > avg_log_mle:[92m -0.39050 [0m(-0.01041)
     | > avg_loss_dur:[91m 0.86985 [0m(+0.04770)


[4m[1m > EPOCH: 767/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:08:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01001)
     | > avg_loss:[91m 0.48774 [0m(+0.00839)
     | > avg_log_mle:[91m -0.38773 [0m(+0.00277)
     | > avg_loss_dur:[91m 0.87547 [0m(+0.00562)


[4m[1m > EPOCH: 768/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:08:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 13825[0m
     | > loss: -0.65390  (-0.65390)
     | > log_mle: -0.72626  (-0.72626)
     | > loss_dur: 0.07236  (0.07236)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.46311  (12.46311)
     | > current_lr: 0.00019 
     | > step_time: 0.64960  (0.64959)
     | > loader_time: 0.39140  (0.39136)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00500)
     | > avg_loss:[92m 0.47994 [0m(-0.00780)
     | > avg_log_mle:[92m -0.39615 [0m(-0.00843)
     | > avg_loss_dur:[91m 0.87609 [0m(+0.00063)


[4m[1m > EPOCH: 769/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:09:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 13850[0m
     | > loss: -0.56790  (-0.60305)
     | > log_mle: -0.66674  (-0.68883)
     | > loss_dur: 0.09884  (0.08579)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.86970  (15.78362)
     | > current_lr: 0.00019 
     | > step_time: 0.68360  (0.66661)
     | > loader_time: 0.40040  (0.41062)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[92m 0.43831 [0m(-0.04163)
     | > avg_log_mle:[91m -0.38905 [0m(+0.00710)
     | > avg_loss_dur:[92m 0.82736 [0m(-0.04873)


[4m[1m > EPOCH: 770/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:09:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 13875[0m
     | > loss: -0.48460  (-0.56452)
     | > log_mle: -0.59621  (-0.66056)
     | > loss_dur: 0.11161  (0.09604)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.76077  (12.99526)
     | > current_lr: 0.00019 
     | > step_time: 0.87580  (0.74902)
     | > loader_time: 0.52750  (0.48103)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00300)
     | > avg_loss:[92m 0.42560 [0m(-0.01271)
     | > avg_log_mle:[91m -0.38629 [0m(+0.00277)
     | > avg_loss_dur:[92m 0.81189 [0m(-0.01548)


[4m[1m > EPOCH: 771/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:10:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00300)
     | > avg_loss:[92m 0.39977 [0m(-0.02583)
     | > avg_log_mle:[92m -0.38720 [0m(-0.00091)
     | > avg_loss_dur:[92m 0.78697 [0m(-0.02491)


[4m[1m > EPOCH: 772/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:10:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 13900[0m
     | > loss: -0.59770  (-0.62765)
     | > log_mle: -0.68770  (-0.70870)
     | > loss_dur: 0.09000  (0.08105)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.28054  (16.25763)
     | > current_lr: 0.00019 
     | > step_time: 0.73070  (0.65935)
     | > loader_time: 0.47940  (0.40161)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00500)
     | > avg_loss:[91m 0.43739 [0m(+0.03761)
     | > avg_log_mle:[91m -0.38626 [0m(+0.00094)
     | > avg_loss_dur:[91m 0.82364 [0m(+0.03667)


[4m[1m > EPOCH: 773/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:11:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 13925[0m
     | > loss: -0.56299  (-0.59956)
     | > log_mle: -0.65814  (-0.68855)
     | > loss_dur: 0.09515  (0.08900)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.67950  (16.82215)
     | > current_lr: 0.00019 
     | > step_time: 0.74170  (0.69782)
     | > loader_time: 0.47640  (0.44149)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01101)
     | > avg_loss:[91m 0.43768 [0m(+0.00029)
     | > avg_log_mle:[92m -0.38656 [0m(-0.00030)
     | > avg_loss_dur:[91m 0.82424 [0m(+0.00059)


[4m[1m > EPOCH: 774/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:11:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00701)
     | > avg_loss:[92m 0.42497 [0m(-0.01271)
     | > avg_log_mle:[91m -0.38307 [0m(+0.00350)
     | > avg_loss_dur:[92m 0.80804 [0m(-0.01620)


[4m[1m > EPOCH: 775/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:12:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 13950[0m
     | > loss: -0.66838  (-0.66838)
     | > log_mle: -0.73897  (-0.73897)
     | > loss_dur: 0.07059  (0.07059)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.37896  (8.37896)
     | > current_lr: 0.00019 
     | > step_time: 0.49950  (0.49946)
     | > loader_time: 0.28130  (0.28125)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00500)
     | > avg_loss:[91m 0.43760 [0m(+0.01263)
     | > avg_log_mle:[91m -0.37230 [0m(+0.01077)
     | > avg_loss_dur:[91m 0.80990 [0m(+0.00187)


[4m[1m > EPOCH: 776/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:13:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 13975[0m
     | > loss: -0.57020  (-0.61204)
     | > log_mle: -0.65970  (-0.69554)
     | > loss_dur: 0.08950  (0.08350)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.37838  (12.43139)
     | > current_lr: 0.00019 
     | > step_time: 0.65160  (0.66518)
     | > loader_time: 0.43340  (0.42281)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00801)
     | > avg_loss:[92m 0.41177 [0m(-0.02583)
     | > avg_log_mle:[91m -0.37077 [0m(+0.00152)
     | > avg_loss_dur:[92m 0.78254 [0m(-0.02736)


[4m[1m > EPOCH: 777/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:13:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 14000[0m
     | > loss: -0.51306  (-0.57178)
     | > log_mle: -0.61296  (-0.66644)
     | > loss_dur: 0.09990  (0.09466)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.12513  (8.68126)
     | > current_lr: 0.00019 
     | > step_time: 1.01290  (0.74325)
     | > loader_time: 0.60050  (0.46892)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01001)
     | > avg_loss:[91m 0.42174 [0m(+0.00997)
     | > avg_log_mle:[92m -0.38297 [0m(-0.01219)
     | > avg_loss_dur:[91m 0.80471 [0m(+0.02217)


[4m[1m > EPOCH: 778/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:14:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.01201)
     | > avg_loss:[91m 0.51565 [0m(+0.09390)
     | > avg_log_mle:[92m -0.38416 [0m(-0.00119)
     | > avg_loss_dur:[91m 0.89981 [0m(+0.09509)


[4m[1m > EPOCH: 779/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:14:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 14025[0m
     | > loss: -0.64544  (-0.65489)
     | > log_mle: -0.72762  (-0.73177)
     | > loss_dur: 0.08218  (0.07688)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.93832  (10.15504)
     | > current_lr: 0.00019 
     | > step_time: 0.68860  (0.63858)
     | > loader_time: 0.41940  (0.38035)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00400)
     | > avg_loss:[92m 0.44367 [0m(-0.07197)
     | > avg_log_mle:[92m -0.38618 [0m(-0.00202)
     | > avg_loss_dur:[92m 0.82985 [0m(-0.06995)


[4m[1m > EPOCH: 780/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:15:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 14050[0m
     | > loss: -0.56267  (-0.60595)
     | > log_mle: -0.66348  (-0.69549)
     | > loss_dur: 0.10081  (0.08954)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.43576  (16.54668)
     | > current_lr: 0.00019 
     | > step_time: 0.70160  (0.69353)
     | > loader_time: 0.42240  (0.42178)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00200)
     | > avg_loss:[92m 0.43981 [0m(-0.00386)
     | > avg_log_mle:[92m -0.38697 [0m(-0.00080)
     | > avg_loss_dur:[92m 0.82679 [0m(-0.00307)


[4m[1m > EPOCH: 781/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:15:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 14075[0m
     | > loss: -0.51354  (-0.57771)
     | > log_mle: -0.61238  (-0.66911)
     | > loss_dur: 0.09883  (0.09140)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.90649  (13.36358)
     | > current_lr: 0.00020 
     | > step_time: 0.84980  (0.76905)
     | > loader_time: 0.42840  (0.47555)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01001)
     | > avg_loss:[92m 0.41188 [0m(-0.02793)
     | > avg_log_mle:[91m -0.38652 [0m(+0.00045)
     | > avg_loss_dur:[92m 0.79841 [0m(-0.02838)


[4m[1m > EPOCH: 782/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:16:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00100)
     | > avg_loss:[91m 0.48973 [0m(+0.07785)
     | > avg_log_mle:[91m -0.37623 [0m(+0.01030)
     | > avg_loss_dur:[91m 0.86596 [0m(+0.06755)


[4m[1m > EPOCH: 783/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:16:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 14100[0m
     | > loss: -0.56120  (-0.62988)
     | > log_mle: -0.65975  (-0.71126)
     | > loss_dur: 0.09855  (0.08137)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.23378  (12.24026)
     | > current_lr: 0.00020 
     | > step_time: 0.63960  (0.67194)
     | > loader_time: 0.39540  (0.46042)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06106 [0m(-0.01501)
     | > avg_loss:[92m 0.48744 [0m(-0.00229)
     | > avg_log_mle:[91m -0.37070 [0m(+0.00553)
     | > avg_loss_dur:[92m 0.85814 [0m(-0.00782)


[4m[1m > EPOCH: 784/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:17:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 14125[0m
     | > loss: -0.48816  (-0.58507)
     | > log_mle: -0.59822  (-0.67834)
     | > loss_dur: 0.11006  (0.09327)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.27316  (16.87410)
     | > current_lr: 0.00020 
     | > step_time: 0.80270  (0.72451)
     | > loader_time: 0.56750  (0.46604)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00901)
     | > avg_loss:[92m 0.44678 [0m(-0.04067)
     | > avg_log_mle:[92m -0.38146 [0m(-0.01076)
     | > avg_loss_dur:[92m 0.82824 [0m(-0.02991)


[4m[1m > EPOCH: 785/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:17:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00200)
     | > avg_loss:[91m 0.46723 [0m(+0.02045)
     | > avg_log_mle:[92m -0.38589 [0m(-0.00443)
     | > avg_loss_dur:[91m 0.85312 [0m(+0.02488)


[4m[1m > EPOCH: 786/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:18:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 14150[0m
     | > loss: -0.64042  (-0.66097)
     | > log_mle: -0.71856  (-0.73488)
     | > loss_dur: 0.07814  (0.07391)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.60879  (14.86380)
     | > current_lr: 0.00020 
     | > step_time: 0.56050  (0.60755)
     | > loader_time: 0.33830  (0.34431)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.49645 [0m(+0.02922)
     | > avg_log_mle:[91m -0.37549 [0m(+0.01040)
     | > avg_loss_dur:[91m 0.87194 [0m(+0.01882)


[4m[1m > EPOCH: 787/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:18:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 14175[0m
     | > loss: -0.60256  (-0.62515)
     | > log_mle: -0.69547  (-0.70926)
     | > loss_dur: 0.09291  (0.08411)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.59632  (11.50562)
     | > current_lr: 0.00020 
     | > step_time: 0.87280  (0.69330)
     | > loader_time: 0.61160  (0.44007)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00200)
     | > avg_loss:[91m 0.52367 [0m(+0.02721)
     | > avg_log_mle:[91m -0.36230 [0m(+0.01318)
     | > avg_loss_dur:[91m 0.88597 [0m(+0.01403)


[4m[1m > EPOCH: 788/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:19:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 14200[0m
     | > loss: -0.49429  (-0.57557)
     | > log_mle: -0.59717  (-0.66826)
     | > loss_dur: 0.10288  (0.09269)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.25687  (16.96442)
     | > current_lr: 0.00020 
     | > step_time: 0.95490  (0.76495)
     | > loader_time: 0.58250  (0.48262)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[92m 0.44031 [0m(-0.08336)
     | > avg_log_mle:[92m -0.37527 [0m(-0.01297)
     | > avg_loss_dur:[92m 0.81558 [0m(-0.07039)


[4m[1m > EPOCH: 789/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:19:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00200)
     | > avg_loss:[91m 0.49513 [0m(+0.05483)
     | > avg_log_mle:[91m -0.36964 [0m(+0.00563)
     | > avg_loss_dur:[91m 0.86477 [0m(+0.04919)


[4m[1m > EPOCH: 790/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:20:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 14225[0m
     | > loss: -0.58234  (-0.63741)
     | > log_mle: -0.67503  (-0.71514)
     | > loss_dur: 0.09269  (0.07773)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 28.58790  (27.89948)
     | > current_lr: 0.00020 
     | > step_time: 0.74070  (0.67762)
     | > loader_time: 0.53050  (0.45241)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00400)
     | > avg_loss:[92m 0.42226 [0m(-0.07287)
     | > avg_log_mle:[92m -0.38232 [0m(-0.01268)
     | > avg_loss_dur:[92m 0.80458 [0m(-0.06019)


[4m[1m > EPOCH: 791/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:20:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 14250[0m
     | > loss: -0.52044  (-0.59811)
     | > log_mle: -0.62747  (-0.68831)
     | > loss_dur: 0.10703  (0.09020)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.46192  (18.78621)
     | > current_lr: 0.00020 
     | > step_time: 0.91180  (0.71674)
     | > loader_time: 0.63960  (0.45992)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00400)
     | > avg_loss:[91m 0.42574 [0m(+0.00348)
     | > avg_log_mle:[91m -0.36958 [0m(+0.01274)
     | > avg_loss_dur:[92m 0.79532 [0m(-0.00926)


[4m[1m > EPOCH: 792/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:21:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06406 [0m(-0.00801)
     | > avg_loss:[91m 0.48581 [0m(+0.06006)
     | > avg_log_mle:[92m -0.37413 [0m(-0.00455)
     | > avg_loss_dur:[91m 0.85993 [0m(+0.06461)


[4m[1m > EPOCH: 793/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:21:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 14275[0m
     | > loss: -0.68782  (-0.68782)
     | > log_mle: -0.75668  (-0.75668)
     | > loss_dur: 0.06886  (0.06886)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.91657  (7.91657)
     | > current_lr: 0.00020 
     | > step_time: 0.65360  (0.65359)
     | > loader_time: 0.35330  (0.35332)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00100)
     | > avg_loss:[92m 0.45436 [0m(-0.03145)
     | > avg_log_mle:[91m -0.37323 [0m(+0.00090)
     | > avg_loss_dur:[92m 0.82759 [0m(-0.03235)


[4m[1m > EPOCH: 794/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:22:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 14300[0m
     | > loss: -0.59839  (-0.62100)
     | > log_mle: -0.69358  (-0.70506)
     | > loss_dur: 0.09519  (0.08405)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.67871  (12.94998)
     | > current_lr: 0.00020 
     | > step_time: 0.67560  (0.66686)
     | > loader_time: 0.42340  (0.41463)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00901)
     | > avg_loss:[91m 0.45784 [0m(+0.00348)
     | > avg_log_mle:[91m -0.35762 [0m(+0.01561)
     | > avg_loss_dur:[92m 0.81546 [0m(-0.01213)


[4m[1m > EPOCH: 795/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:22:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 14325[0m
     | > loss: -0.47588  (-0.58024)
     | > log_mle: -0.58876  (-0.67345)
     | > loss_dur: 0.11288  (0.09321)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 46.07416  (14.55527)
     | > current_lr: 0.00020 
     | > step_time: 0.88380  (0.75343)
     | > loader_time: 0.53250  (0.47264)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00501)
     | > avg_loss:[91m 0.49881 [0m(+0.04098)
     | > avg_log_mle:[92m -0.36476 [0m(-0.00714)
     | > avg_loss_dur:[91m 0.86357 [0m(+0.04811)


[4m[1m > EPOCH: 796/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:23:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00200)
     | > avg_loss:[92m 0.40892 [0m(-0.08990)
     | > avg_log_mle:[92m -0.37792 [0m(-0.01316)
     | > avg_loss_dur:[92m 0.78684 [0m(-0.07673)


[4m[1m > EPOCH: 797/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:23:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 14350[0m
     | > loss: -0.62394  (-0.64812)
     | > log_mle: -0.71211  (-0.72858)
     | > loss_dur: 0.08817  (0.08045)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.96178  (10.72120)
     | > current_lr: 0.00020 
     | > step_time: 0.73270  (0.65935)
     | > loader_time: 0.48040  (0.39936)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00801)
     | > avg_loss:[91m 0.43066 [0m(+0.02175)
     | > avg_log_mle:[91m -0.37472 [0m(+0.00320)
     | > avg_loss_dur:[91m 0.80538 [0m(+0.01854)


[4m[1m > EPOCH: 798/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:24:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 14375[0m
     | > loss: -0.59009  (-0.60288)
     | > log_mle: -0.68258  (-0.69537)
     | > loss_dur: 0.09249  (0.09249)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.32475  (18.95296)
     | > current_lr: 0.00020 
     | > step_time: 0.74370  (0.69763)
     | > loader_time: 0.48240  (0.44331)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00701)
     | > avg_loss:[91m 0.45148 [0m(+0.02082)
     | > avg_log_mle:[91m -0.36663 [0m(+0.00809)
     | > avg_loss_dur:[91m 0.81812 [0m(+0.01273)


[4m[1m > EPOCH: 799/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:25:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[91m 0.52538 [0m(+0.07390)
     | > avg_log_mle:[91m -0.36163 [0m(+0.00500)
     | > avg_loss_dur:[91m 0.88701 [0m(+0.06890)


[4m[1m > EPOCH: 800/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:25:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 14400[0m
     | > loss: -0.65301  (-0.65301)
     | > log_mle: -0.72783  (-0.72783)
     | > loss_dur: 0.07482  (0.07482)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 30.96430  (30.96430)
     | > current_lr: 0.00020 
     | > step_time: 0.63660  (0.63658)
     | > loader_time: 0.27320  (0.27325)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00601)
     | > avg_loss:[92m 0.42930 [0m(-0.09608)
     | > avg_log_mle:[92m -0.37304 [0m(-0.01141)
     | > avg_loss_dur:[92m 0.80234 [0m(-0.08468)


[4m[1m > EPOCH: 801/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:26:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 14425[0m
     | > loss: -0.60333  (-0.61916)
     | > log_mle: -0.69272  (-0.70509)
     | > loss_dur: 0.08939  (0.08593)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.55589  (13.20723)
     | > current_lr: 0.00020 
     | > step_time: 0.64960  (0.66847)
     | > loader_time: 0.39240  (0.40508)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00200)
     | > avg_loss:[91m 0.43597 [0m(+0.00667)
     | > avg_log_mle:[91m -0.37169 [0m(+0.00135)
     | > avg_loss_dur:[91m 0.80766 [0m(+0.00532)


[4m[1m > EPOCH: 802/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:26:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 14450[0m
     | > loss: -0.51640  (-0.57911)
     | > log_mle: -0.62287  (-0.67490)
     | > loss_dur: 0.10647  (0.09578)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.51390  (13.74572)
     | > current_lr: 0.00020 
     | > step_time: 1.02590  (0.74304)
     | > loader_time: 0.62360  (0.47221)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.00601)
     | > avg_loss:[91m 0.45240 [0m(+0.01644)
     | > avg_log_mle:[92m -0.37230 [0m(-0.00062)
     | > avg_loss_dur:[91m 0.82471 [0m(+0.01705)


[4m[1m > EPOCH: 803/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:27:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.01001)
     | > avg_loss:[92m 0.44422 [0m(-0.00819)
     | > avg_log_mle:[91m -0.35807 [0m(+0.01423)
     | > avg_loss_dur:[92m 0.80229 [0m(-0.02242)


[4m[1m > EPOCH: 804/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:27:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 14475[0m
     | > loss: -0.65437  (-0.66110)
     | > log_mle: -0.74021  (-0.73942)
     | > loss_dur: 0.08583  (0.07833)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.11369  (12.31876)
     | > current_lr: 0.00020 
     | > step_time: 0.68960  (0.63424)
     | > loader_time: 0.42240  (0.38068)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.06906 [0m(+0.00000)
     | > avg_loss:[91m 0.54695 [0m(+0.10274)
     | > avg_log_mle:[92m -0.36688 [0m(-0.00880)
     | > avg_loss_dur:[91m 0.91383 [0m(+0.11154)


[4m[1m > EPOCH: 805/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:28:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 14500[0m
     | > loss: -0.59779  (-0.60532)
     | > log_mle: -0.68697  (-0.69755)
     | > loss_dur: 0.08918  (0.09224)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.92764  (18.88890)
     | > current_lr: 0.00020 
     | > step_time: 0.70260  (0.69313)
     | > loader_time: 0.49240  (0.44560)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00300)
     | > avg_loss:[92m 0.46110 [0m(-0.08585)
     | > avg_log_mle:[92m -0.37516 [0m(-0.00829)
     | > avg_loss_dur:[92m 0.83626 [0m(-0.07757)


[4m[1m > EPOCH: 806/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:28:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 14525[0m
     | > loss: -0.51279  (-0.58597)
     | > log_mle: -0.60700  (-0.67583)
     | > loss_dur: 0.09421  (0.08986)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.97748  (14.57359)
     | > current_lr: 0.00020 
     | > step_time: 0.84780  (0.76852)
     | > loader_time: 0.48240  (0.48874)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00400)
     | > avg_loss:[92m 0.42215 [0m(-0.03895)
     | > avg_log_mle:[91m -0.35798 [0m(+0.01718)
     | > avg_loss_dur:[92m 0.78013 [0m(-0.05613)


[4m[1m > EPOCH: 807/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:29:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00801)
     | > avg_loss:[91m 0.44389 [0m(+0.02174)
     | > avg_log_mle:[92m -0.36110 [0m(-0.00312)
     | > avg_loss_dur:[91m 0.80499 [0m(+0.02486)


[4m[1m > EPOCH: 808/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:29:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 14550[0m
     | > loss: -0.55875  (-0.62284)
     | > log_mle: -0.66282  (-0.70758)
     | > loss_dur: 0.10407  (0.08474)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.50930  (18.93210)
     | > current_lr: 0.00020 
     | > step_time: 0.64060  (0.66777)
     | > loader_time: 0.37530  (0.41638)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00901)
     | > avg_loss:[92m 0.41297 [0m(-0.03092)
     | > avg_log_mle:[92m -0.36788 [0m(-0.00677)
     | > avg_loss_dur:[92m 0.78085 [0m(-0.02414)


[4m[1m > EPOCH: 809/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:30:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 14575[0m
     | > loss: -0.52782  (-0.59677)
     | > log_mle: -0.62709  (-0.68525)
     | > loss_dur: 0.09927  (0.08848)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 33.06394  (14.61742)
     | > current_lr: 0.00020 
     | > step_time: 0.78670  (0.72150)
     | > loader_time: 0.49950  (0.46203)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00601)
     | > avg_loss:[91m 0.47355 [0m(+0.06058)
     | > avg_log_mle:[91m -0.35736 [0m(+0.01052)
     | > avg_loss_dur:[91m 0.83091 [0m(+0.05006)


[4m[1m > EPOCH: 810/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:30:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[91m 0.49390 [0m(+0.02036)
     | > avg_log_mle:[92m -0.36468 [0m(-0.00732)
     | > avg_loss_dur:[91m 0.85858 [0m(+0.02767)


[4m[1m > EPOCH: 811/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:31:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 14600[0m
     | > loss: -0.67279  (-0.68172)
     | > log_mle: -0.74726  (-0.75249)
     | > loss_dur: 0.07447  (0.07077)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.95861  (9.78588)
     | > current_lr: 0.00020 
     | > step_time: 0.56350  (0.60805)
     | > loader_time: 0.33130  (0.36033)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00400)
     | > avg_loss:[92m 0.37065 [0m(-0.12325)
     | > avg_log_mle:[92m -0.36822 [0m(-0.00354)
     | > avg_loss_dur:[92m 0.73887 [0m(-0.11971)


[4m[1m > EPOCH: 812/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:31:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 14625[0m
     | > loss: -0.58374  (-0.59806)
     | > log_mle: -0.67569  (-0.68978)
     | > loss_dur: 0.09195  (0.09172)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.08755  (18.55065)
     | > current_lr: 0.00020 
     | > step_time: 0.87680  (0.69107)
     | > loader_time: 0.56050  (0.45719)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00100)
     | > avg_loss:[91m 0.48746 [0m(+0.11681)
     | > avg_log_mle:[92m -0.37008 [0m(-0.00186)
     | > avg_loss_dur:[91m 0.85754 [0m(+0.11867)


[4m[1m > EPOCH: 813/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:32:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 14650[0m
     | > loss: -0.47835  (-0.56194)
     | > log_mle: -0.59311  (-0.66245)
     | > loss_dur: 0.11476  (0.10051)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.27293  (17.59485)
     | > current_lr: 0.00020 
     | > step_time: 0.95090  (0.76345)
     | > loader_time: 0.61460  (0.49176)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06105 [0m(-0.01201)
     | > avg_loss:[92m 0.47421 [0m(-0.01325)
     | > avg_log_mle:[92m -0.37020 [0m(-0.00012)
     | > avg_loss_dur:[92m 0.84441 [0m(-0.01313)


[4m[1m > EPOCH: 814/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:32:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06406 [0m(+0.00300)
     | > avg_loss:[92m 0.44716 [0m(-0.02705)
     | > avg_log_mle:[92m -0.37129 [0m(-0.00109)
     | > avg_loss_dur:[92m 0.81845 [0m(-0.02596)


[4m[1m > EPOCH: 815/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:33:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 14675[0m
     | > loss: -0.56905  (-0.63671)
     | > log_mle: -0.67363  (-0.72145)
     | > loss_dur: 0.10458  (0.08475)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.70860  (13.72397)
     | > current_lr: 0.00020 
     | > step_time: 0.74070  (0.67241)
     | > loader_time: 0.47140  (0.41798)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00901)
     | > avg_loss:[91m 0.45060 [0m(+0.00344)
     | > avg_log_mle:[92m -0.37391 [0m(-0.00262)
     | > avg_loss_dur:[91m 0.82451 [0m(+0.00606)


[4m[1m > EPOCH: 816/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:33:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 14700[0m
     | > loss: -0.52554  (-0.58384)
     | > log_mle: -0.63389  (-0.68080)
     | > loss_dur: 0.10835  (0.09697)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.13434  (16.27620)
     | > current_lr: 0.00020 
     | > step_time: 0.91380  (0.71282)
     | > loader_time: 0.67760  (0.45266)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00601)
     | > avg_loss:[91m 0.46594 [0m(+0.01534)
     | > avg_log_mle:[91m -0.35925 [0m(+0.01466)
     | > avg_loss_dur:[91m 0.82519 [0m(+0.00068)


[4m[1m > EPOCH: 817/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:34:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[92m 0.40843 [0m(-0.05751)
     | > avg_log_mle:[91m -0.35314 [0m(+0.00611)
     | > avg_loss_dur:[92m 0.76158 [0m(-0.06362)


[4m[1m > EPOCH: 818/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:34:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 14725[0m
     | > loss: -0.68509  (-0.68509)
     | > log_mle: -0.75773  (-0.75773)
     | > loss_dur: 0.07264  (0.07264)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.75027  (6.75027)
     | > current_lr: 0.00020 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.37130  (0.37134)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00100)
     | > avg_loss:[91m 0.45694 [0m(+0.04850)
     | > avg_log_mle:[92m -0.36284 [0m(-0.00970)
     | > avg_loss_dur:[91m 0.81978 [0m(+0.05820)


[4m[1m > EPOCH: 819/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:35:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 14750[0m
     | > loss: -0.57002  (-0.61903)
     | > log_mle: -0.67765  (-0.70683)
     | > loss_dur: 0.10763  (0.08780)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.27473  (13.59415)
     | > current_lr: 0.00020 
     | > step_time: 0.67960  (0.67111)
     | > loader_time: 0.38330  (0.40624)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00500)
     | > avg_loss:[91m 0.45773 [0m(+0.00079)
     | > avg_log_mle:[92m -0.37006 [0m(-0.00722)
     | > avg_loss_dur:[91m 0.82779 [0m(+0.00801)


[4m[1m > EPOCH: 820/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:35:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 14775[0m
     | > loss: -0.51025  (-0.59586)
     | > log_mle: -0.61601  (-0.68564)
     | > loss_dur: 0.10576  (0.08978)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.99416  (18.81331)
     | > current_lr: 0.00020 
     | > step_time: 0.87280  (0.75294)
     | > loader_time: 0.51950  (0.47590)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[91m 0.48968 [0m(+0.03195)
     | > avg_log_mle:[91m -0.36084 [0m(+0.00922)
     | > avg_loss_dur:[91m 0.85052 [0m(+0.02273)


[4m[1m > EPOCH: 821/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:36:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00701)
     | > avg_loss:[92m 0.43712 [0m(-0.05256)
     | > avg_log_mle:[91m -0.34720 [0m(+0.01364)
     | > avg_loss_dur:[92m 0.78432 [0m(-0.06620)


[4m[1m > EPOCH: 822/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:36:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 14800[0m
     | > loss: -0.63939  (-0.67030)
     | > log_mle: -0.71705  (-0.74262)
     | > loss_dur: 0.07767  (0.07232)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.59900  (6.50777)
     | > current_lr: 0.00021 
     | > step_time: 0.72770  (0.65585)
     | > loader_time: 0.48440  (0.41137)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.01301)
     | > avg_loss:[91m 0.47071 [0m(+0.03359)
     | > avg_log_mle:[92m -0.35651 [0m(-0.00931)
     | > avg_loss_dur:[91m 0.82722 [0m(+0.04289)


[4m[1m > EPOCH: 823/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:37:28) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 14825[0m
     | > loss: -0.54583  (-0.60676)
     | > log_mle: -0.64653  (-0.69666)
     | > loss_dur: 0.10069  (0.08990)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.01034  (16.30964)
     | > current_lr: 0.00021 
     | > step_time: 0.74370  (0.69536)
     | > loader_time: 0.43140  (0.42775)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.01702)
     | > avg_loss:[92m 0.45725 [0m(-0.01345)
     | > avg_log_mle:[92m -0.36293 [0m(-0.00642)
     | > avg_loss_dur:[92m 0.82018 [0m(-0.00704)


[4m[1m > EPOCH: 824/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:37:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00801)
     | > avg_loss:[92m 0.44924 [0m(-0.00801)
     | > avg_log_mle:[91m -0.36040 [0m(+0.00252)
     | > avg_loss_dur:[92m 0.80965 [0m(-0.01053)


[4m[1m > EPOCH: 825/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:38:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 14850[0m
     | > loss: -0.68645  (-0.68645)
     | > log_mle: -0.76016  (-0.76016)
     | > loss_dur: 0.07372  (0.07372)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.02216  (14.02216)
     | > current_lr: 0.00021 
     | > step_time: 0.50150  (0.50146)
     | > loader_time: 0.28330  (0.28326)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.54544 [0m(+0.09619)
     | > avg_log_mle:[91m -0.32704 [0m(+0.03337)
     | > avg_loss_dur:[91m 0.87247 [0m(+0.06282)


[4m[1m > EPOCH: 826/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:39:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 14875[0m
     | > loss: -0.54585  (-0.59170)
     | > log_mle: -0.66327  (-0.68998)
     | > loss_dur: 0.11743  (0.09827)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.76017  (21.35505)
     | > current_lr: 0.00021 
     | > step_time: 0.65060  (0.66718)
     | > loader_time: 0.40640  (0.39693)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00200)
     | > avg_loss:[92m 0.45637 [0m(-0.08907)
     | > avg_log_mle:[92m -0.36337 [0m(-0.03634)
     | > avg_loss_dur:[92m 0.81974 [0m(-0.05273)


[4m[1m > EPOCH: 827/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:39:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 14900[0m
     | > loss: -0.52274  (-0.58790)
     | > log_mle: -0.62563  (-0.68455)
     | > loss_dur: 0.10290  (0.09665)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 34.58789  (19.12130)
     | > current_lr: 0.00021 
     | > step_time: 1.02790  (0.74225)
     | > loader_time: 0.65660  (0.47450)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00701)
     | > avg_loss:[92m 0.45008 [0m(-0.00630)
     | > avg_log_mle:[91m -0.35035 [0m(+0.01303)
     | > avg_loss_dur:[92m 0.80042 [0m(-0.01932)


[4m[1m > EPOCH: 828/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:40:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00500)
     | > avg_loss:[91m 0.47825 [0m(+0.02818)
     | > avg_log_mle:[92m -0.35742 [0m(-0.00707)
     | > avg_loss_dur:[91m 0.83567 [0m(+0.03525)


[4m[1m > EPOCH: 829/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:40:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 14925[0m
     | > loss: -0.67594  (-0.67283)
     | > log_mle: -0.75549  (-0.75085)
     | > loss_dur: 0.07955  (0.07803)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 16.30056  (11.85546)
     | > current_lr: 0.00021 
     | > step_time: 0.68660  (0.63324)
     | > loader_time: 0.40740  (0.37334)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00300)
     | > avg_loss:[92m 0.46534 [0m(-0.01292)
     | > avg_log_mle:[92m -0.36202 [0m(-0.00460)
     | > avg_loss_dur:[92m 0.82736 [0m(-0.00831)


[4m[1m > EPOCH: 830/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:41:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 14950[0m
     | > loss: -0.57845  (-0.61589)
     | > log_mle: -0.67804  (-0.70490)
     | > loss_dur: 0.09959  (0.08902)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 12.80150  (15.87262)
     | > current_lr: 0.00021 
     | > step_time: 0.70760  (0.69734)
     | > loader_time: 0.45140  (0.42479)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06806 [0m(+0.00300)
     | > avg_loss:[92m 0.43463 [0m(-0.03071)
     | > avg_log_mle:[91m -0.34568 [0m(+0.01635)
     | > avg_loss_dur:[92m 0.78030 [0m(-0.04706)


[4m[1m > EPOCH: 831/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:41:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 14975[0m
     | > loss: -0.51092  (-0.58426)
     | > log_mle: -0.61025  (-0.67471)
     | > loss_dur: 0.09933  (0.09045)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.43618  (14.29982)
     | > current_lr: 0.00021 
     | > step_time: 0.84380  (0.77094)
     | > loader_time: 0.41840  (0.48709)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[91m 0.49054 [0m(+0.05591)
     | > avg_log_mle:[92m -0.36759 [0m(-0.02191)
     | > avg_loss_dur:[91m 0.85812 [0m(+0.07782)


[4m[1m > EPOCH: 832/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:42:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[92m 0.44351 [0m(-0.04702)
     | > avg_log_mle:[91m -0.36039 [0m(+0.00720)
     | > avg_loss_dur:[92m 0.80390 [0m(-0.05422)


[4m[1m > EPOCH: 833/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:42:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 15000[0m
     | > loss: -0.57391  (-0.64591)
     | > log_mle: -0.67056  (-0.72741)
     | > loss_dur: 0.09665  (0.08150)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 3.99949  (11.68250)
     | > current_lr: 0.00021 
     | > step_time: 0.63060  (0.67144)
     | > loader_time: 0.41040  (0.41221)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[91m 0.44647 [0m(+0.00296)
     | > avg_log_mle:[91m -0.36004 [0m(+0.00035)
     | > avg_loss_dur:[91m 0.80652 [0m(+0.00261)


[4m[1m > EPOCH: 834/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:43:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 15025[0m
     | > loss: -0.51524  (-0.60786)
     | > log_mle: -0.62362  (-0.69883)
     | > loss_dur: 0.10838  (0.09096)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 16.69197  (11.65651)
     | > current_lr: 0.00021 
     | > step_time: 0.78770  (0.71989)
     | > loader_time: 0.49950  (0.44510)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[91m 0.47429 [0m(+0.02782)
     | > avg_log_mle:[91m -0.34074 [0m(+0.01930)
     | > avg_loss_dur:[91m 0.81503 [0m(+0.00852)


[4m[1m > EPOCH: 835/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:43:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00600)
     | > avg_loss:[92m 0.42948 [0m(-0.04481)
     | > avg_log_mle:[92m -0.35110 [0m(-0.01036)
     | > avg_loss_dur:[92m 0.78058 [0m(-0.03445)


[4m[1m > EPOCH: 836/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:44:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 15050[0m
     | > loss: -0.67596  (-0.68391)
     | > log_mle: -0.74495  (-0.75192)
     | > loss_dur: 0.06899  (0.06801)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.75730  (10.85001)
     | > current_lr: 0.00021 
     | > step_time: 0.56250  (0.60405)
     | > loader_time: 0.32430  (0.35732)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00701)
     | > avg_loss:[91m 0.43769 [0m(+0.00820)
     | > avg_log_mle:[91m -0.34627 [0m(+0.00483)
     | > avg_loss_dur:[91m 0.78396 [0m(+0.00337)


[4m[1m > EPOCH: 837/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:44:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 15075[0m
     | > loss: -0.62556  (-0.63839)
     | > log_mle: -0.71947  (-0.72341)
     | > loss_dur: 0.09391  (0.08503)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.67726  (12.80918)
     | > current_lr: 0.00021 
     | > step_time: 0.87280  (0.69141)
     | > loader_time: 0.58750  (0.42894)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00000)
     | > avg_loss:[91m 0.47118 [0m(+0.03349)
     | > avg_log_mle:[92m -0.35735 [0m(-0.01108)
     | > avg_loss_dur:[91m 0.82853 [0m(+0.04458)


[4m[1m > EPOCH: 838/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:45:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 15100[0m
     | > loss: -0.52323  (-0.60337)
     | > log_mle: -0.62134  (-0.69297)
     | > loss_dur: 0.09811  (0.08960)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.19679  (13.55624)
     | > current_lr: 0.00021 
     | > step_time: 0.95590  (0.76338)
     | > loader_time: 0.59650  (0.48963)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00100)
     | > avg_loss:[92m 0.45048 [0m(-0.02070)
     | > avg_log_mle:[91m -0.35303 [0m(+0.00433)
     | > avg_loss_dur:[92m 0.80351 [0m(-0.02502)


[4m[1m > EPOCH: 839/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:45:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00400)
     | > avg_loss:[91m 0.46785 [0m(+0.01737)
     | > avg_log_mle:[91m -0.34669 [0m(+0.00634)
     | > avg_loss_dur:[91m 0.81454 [0m(+0.01103)


[4m[1m > EPOCH: 840/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:46:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 15125[0m
     | > loss: -0.60205  (-0.66197)
     | > log_mle: -0.69312  (-0.74183)
     | > loss_dur: 0.09108  (0.07986)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.22991  (16.73130)
     | > current_lr: 0.00021 
     | > step_time: 0.74470  (0.67562)
     | > loader_time: 0.44240  (0.41918)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00601)
     | > avg_loss:[91m 0.50924 [0m(+0.04139)
     | > avg_log_mle:[91m -0.34453 [0m(+0.00216)
     | > avg_loss_dur:[91m 0.85377 [0m(+0.03923)


[4m[1m > EPOCH: 841/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:46:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 15150[0m
     | > loss: -0.55155  (-0.62395)
     | > log_mle: -0.64521  (-0.70892)
     | > loss_dur: 0.09366  (0.08497)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.41237  (14.30981)
     | > current_lr: 0.00021 
     | > step_time: 0.91580  (0.71482)
     | > loader_time: 0.62660  (0.45324)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00300)
     | > avg_loss:[92m 0.38715 [0m(-0.12209)
     | > avg_log_mle:[92m -0.34612 [0m(-0.00159)
     | > avg_loss_dur:[92m 0.73328 [0m(-0.12050)


[4m[1m > EPOCH: 842/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:47:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[91m 0.43887 [0m(+0.05171)
     | > avg_log_mle:[92m -0.34834 [0m(-0.00221)
     | > avg_loss_dur:[91m 0.78721 [0m(+0.05393)


[4m[1m > EPOCH: 843/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:47:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 15175[0m
     | > loss: -0.72308  (-0.72308)
     | > log_mle: -0.79130  (-0.79130)
     | > loss_dur: 0.06821  (0.06821)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.72669  (12.72669)
     | > current_lr: 0.00021 
     | > step_time: 0.65260  (0.65259)
     | > loader_time: 0.37430  (0.37434)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00300)
     | > avg_loss:[91m 0.48540 [0m(+0.04653)
     | > avg_log_mle:[91m -0.34672 [0m(+0.00162)
     | > avg_loss_dur:[91m 0.83212 [0m(+0.04491)


[4m[1m > EPOCH: 844/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:48:20) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 15200[0m
     | > loss: -0.60596  (-0.65178)
     | > log_mle: -0.69963  (-0.73385)
     | > loss_dur: 0.09368  (0.08208)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.56300  (15.65805)
     | > current_lr: 0.00021 
     | > step_time: 0.67860  (0.66848)
     | > loader_time: 0.44740  (0.41613)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00100)
     | > avg_loss:[92m 0.39873 [0m(-0.08668)
     | > avg_log_mle:[92m -0.34746 [0m(-0.00075)
     | > avg_loss_dur:[92m 0.74619 [0m(-0.08593)


[4m[1m > EPOCH: 845/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:48:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 15225[0m
     | > loss: -0.51126  (-0.61702)
     | > log_mle: -0.61134  (-0.70165)
     | > loss_dur: 0.10008  (0.08463)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.56248  (12.76551)
     | > current_lr: 0.00021 
     | > step_time: 0.87180  (0.75056)
     | > loader_time: 0.53350  (0.51713)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[91m 0.46926 [0m(+0.07054)
     | > avg_log_mle:[91m -0.33531 [0m(+0.01215)
     | > avg_loss_dur:[91m 0.80458 [0m(+0.05839)


[4m[1m > EPOCH: 846/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:49:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00400)
     | > avg_loss:[91m 0.49577 [0m(+0.02651)
     | > avg_log_mle:[92m -0.34943 [0m(-0.01411)
     | > avg_loss_dur:[91m 0.84520 [0m(+0.04062)


[4m[1m > EPOCH: 847/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:49:53) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 15250[0m
     | > loss: -0.63866  (-0.69013)
     | > log_mle: -0.71841  (-0.75873)
     | > loss_dur: 0.07975  (0.06860)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.96857  (17.73183)
     | > current_lr: 0.00021 
     | > step_time: 0.72870  (0.65860)
     | > loader_time: 0.52150  (0.39161)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00300)
     | > avg_loss:[91m 0.53356 [0m(+0.03779)
     | > avg_log_mle:[91m -0.34722 [0m(+0.00221)
     | > avg_loss_dur:[91m 0.88078 [0m(+0.03558)


[4m[1m > EPOCH: 848/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:50:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 15275[0m
     | > loss: -0.60094  (-0.64792)
     | > log_mle: -0.69258  (-0.72762)
     | > loss_dur: 0.09164  (0.07970)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.55553  (14.23417)
     | > current_lr: 0.00021 
     | > step_time: 0.73870  (0.69618)
     | > loader_time: 0.43040  (0.43312)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00100)
     | > avg_loss:[92m 0.48144 [0m(-0.05212)
     | > avg_log_mle:[91m -0.34349 [0m(+0.00372)
     | > avg_loss_dur:[92m 0.82493 [0m(-0.05585)


[4m[1m > EPOCH: 849/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:50:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00500)
     | > avg_loss:[92m 0.47019 [0m(-0.01125)
     | > avg_log_mle:[91m -0.33020 [0m(+0.01330)
     | > avg_loss_dur:[92m 0.80038 [0m(-0.02455)


[4m[1m > EPOCH: 850/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:51:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 15300[0m
     | > loss: -0.72843  (-0.72843)
     | > log_mle: -0.79007  (-0.79007)
     | > loss_dur: 0.06164  (0.06164)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.54956  (22.54956)
     | > current_lr: 0.00021 
     | > step_time: 0.60860  (0.60855)
     | > loader_time: 0.27520  (0.27525)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.01301)
     | > avg_loss:[92m 0.45492 [0m(-0.01527)
     | > avg_log_mle:[92m -0.34506 [0m(-0.01486)
     | > avg_loss_dur:[92m 0.79998 [0m(-0.00041)


[4m[1m > EPOCH: 851/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:51:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 15325[0m
     | > loss: -0.60147  (-0.64627)
     | > log_mle: -0.69353  (-0.72635)
     | > loss_dur: 0.09206  (0.08008)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 21.01768  (16.09582)
     | > current_lr: 0.00021 
     | > step_time: 0.64860  (0.66775)
     | > loader_time: 0.41040  (0.40951)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01101)
     | > avg_loss:[91m 0.46384 [0m(+0.00892)
     | > avg_log_mle:[91m -0.34290 [0m(+0.00216)
     | > avg_loss_dur:[91m 0.80674 [0m(+0.00677)


[4m[1m > EPOCH: 852/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:52:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 15350[0m
     | > loss: -0.55126  (-0.61152)
     | > log_mle: -0.64549  (-0.70152)
     | > loss_dur: 0.09424  (0.09000)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.40854  (13.55304)
     | > current_lr: 0.00021 
     | > step_time: 1.02690  (0.74189)
     | > loader_time: 0.62160  (0.47157)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[92m 0.39770 [0m(-0.06614)
     | > avg_log_mle:[91m -0.33941 [0m(+0.00350)
     | > avg_loss_dur:[92m 0.73710 [0m(-0.06964)


[4m[1m > EPOCH: 853/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:52:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07307 [0m(+0.00000)
     | > avg_loss:[92m 0.38266 [0m(-0.01504)
     | > avg_log_mle:[91m -0.32868 [0m(+0.01073)
     | > avg_loss_dur:[92m 0.71134 [0m(-0.02577)


[4m[1m > EPOCH: 854/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:53:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 15375[0m
     | > loss: -0.70817  (-0.71329)
     | > log_mle: -0.77882  (-0.78023)
     | > loss_dur: 0.07064  (0.06694)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.05544  (10.20055)
     | > current_lr: 0.00021 
     | > step_time: 0.68960  (0.63324)
     | > loader_time: 0.59250  (0.44140)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[91m 0.41836 [0m(+0.03571)
     | > avg_log_mle:[92m -0.33770 [0m(-0.00902)
     | > avg_loss_dur:[91m 0.75606 [0m(+0.04473)


[4m[1m > EPOCH: 855/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:54:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 15400[0m
     | > loss: -0.60178  (-0.64046)
     | > log_mle: -0.69197  (-0.72309)
     | > loss_dur: 0.09019  (0.08262)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.87399  (20.64668)
     | > current_lr: 0.00021 
     | > step_time: 0.70360  (0.69393)
     | > loader_time: 0.43640  (0.43660)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00300)
     | > avg_loss:[91m 0.47239 [0m(+0.05403)
     | > avg_log_mle:[92m -0.33880 [0m(-0.00110)
     | > avg_loss_dur:[91m 0.81120 [0m(+0.05513)


[4m[1m > EPOCH: 856/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:54:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 15425[0m
     | > loss: -0.52455  (-0.60370)
     | > log_mle: -0.62266  (-0.69132)
     | > loss_dur: 0.09811  (0.08762)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.75007  (22.48484)
     | > current_lr: 0.00021 
     | > step_time: 0.84780  (0.76776)
     | > loader_time: 0.44940  (0.48650)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[92m 0.46285 [0m(-0.00954)
     | > avg_log_mle:[92m -0.33924 [0m(-0.00044)
     | > avg_loss_dur:[92m 0.80209 [0m(-0.00910)


[4m[1m > EPOCH: 857/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:55:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00701)
     | > avg_loss:[92m 0.44226 [0m(-0.02059)
     | > avg_log_mle:[91m -0.31726 [0m(+0.02198)
     | > avg_loss_dur:[92m 0.75953 [0m(-0.04257)


[4m[1m > EPOCH: 858/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:55:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 15450[0m
     | > loss: -0.58614  (-0.67358)
     | > log_mle: -0.67976  (-0.74776)
     | > loss_dur: 0.09363  (0.07417)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.17107  (11.28912)
     | > current_lr: 0.00021 
     | > step_time: 0.63660  (0.66727)
     | > loader_time: 0.35630  (0.40854)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07607 [0m(-0.00100)
     | > avg_loss:[91m 0.45249 [0m(+0.01023)
     | > avg_log_mle:[92m -0.33669 [0m(-0.01942)
     | > avg_loss_dur:[91m 0.78918 [0m(+0.02965)


[4m[1m > EPOCH: 859/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:56:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 15475[0m
     | > loss: -0.51297  (-0.61093)
     | > log_mle: -0.62218  (-0.70024)
     | > loss_dur: 0.10921  (0.08931)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.47374  (13.64504)
     | > current_lr: 0.00021 
     | > step_time: 0.78670  (0.72350)
     | > loader_time: 0.50750  (0.46458)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00901)
     | > avg_loss:[92m 0.43716 [0m(-0.01533)
     | > avg_log_mle:[92m -0.34397 [0m(-0.00728)
     | > avg_loss_dur:[92m 0.78113 [0m(-0.00805)


[4m[1m > EPOCH: 860/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:56:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00300)
     | > avg_loss:[92m 0.41515 [0m(-0.02201)
     | > avg_log_mle:[91m -0.34156 [0m(+0.00241)
     | > avg_loss_dur:[92m 0.75671 [0m(-0.02441)


[4m[1m > EPOCH: 861/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:57:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 15500[0m
     | > loss: -0.67968  (-0.70760)
     | > log_mle: -0.75239  (-0.77486)
     | > loss_dur: 0.07271  (0.06726)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.23719  (16.80154)
     | > current_lr: 0.00022 
     | > step_time: 0.56150  (0.60605)
     | > loader_time: 0.33230  (0.36333)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00601)
     | > avg_loss:[91m 0.46033 [0m(+0.04517)
     | > avg_log_mle:[91m -0.34154 [0m(+0.00002)
     | > avg_loss_dur:[91m 0.80187 [0m(+0.04515)


[4m[1m > EPOCH: 862/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:57:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 15525[0m
     | > loss: -0.63068  (-0.63958)
     | > log_mle: -0.71590  (-0.72299)
     | > loss_dur: 0.08522  (0.08342)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.63947  (12.94260)
     | > current_lr: 0.00022 
     | > step_time: 0.87780  (0.69196)
     | > loader_time: 0.58750  (0.42628)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00400)
     | > avg_loss:[92m 0.40889 [0m(-0.05143)
     | > avg_log_mle:[92m -0.34811 [0m(-0.00657)
     | > avg_loss_dur:[92m 0.75700 [0m(-0.04486)


[4m[1m > EPOCH: 863/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:58:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 15550[0m
     | > loss: -0.54140  (-0.60890)
     | > log_mle: -0.63940  (-0.69909)
     | > loss_dur: 0.09800  (0.09019)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.73982  (20.54797)
     | > current_lr: 0.00022 
     | > step_time: 0.95090  (0.76219)
     | > loader_time: 0.60250  (0.49877)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.41676 [0m(+0.00787)
     | > avg_log_mle:[91m -0.34347 [0m(+0.00464)
     | > avg_loss_dur:[91m 0.76023 [0m(+0.00323)


[4m[1m > EPOCH: 864/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:58:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00601)
     | > avg_loss:[91m 0.45224 [0m(+0.03548)
     | > avg_log_mle:[91m -0.33824 [0m(+0.00523)
     | > avg_loss_dur:[91m 0.79048 [0m(+0.03025)


[4m[1m > EPOCH: 865/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:59:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 15575[0m
     | > loss: -0.61767  (-0.68399)
     | > log_mle: -0.70295  (-0.75656)
     | > loss_dur: 0.08528  (0.07257)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.07529  (11.32773)
     | > current_lr: 0.00022 
     | > step_time: 0.74170  (0.67381)
     | > loader_time: 0.47440  (0.41277)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01001)
     | > avg_loss:[92m 0.44425 [0m(-0.00800)
     | > avg_log_mle:[91m -0.33713 [0m(+0.00112)
     | > avg_loss_dur:[92m 0.78137 [0m(-0.00911)


[4m[1m > EPOCH: 866/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 13:59:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 15600[0m
     | > loss: -0.54207  (-0.63529)
     | > log_mle: -0.65164  (-0.72034)
     | > loss_dur: 0.10957  (0.08505)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.62325  (15.07719)
     | > current_lr: 0.00022 
     | > step_time: 0.91380  (0.71448)
     | > loader_time: 0.60250  (0.45808)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00701)
     | > avg_loss:[92m 0.42813 [0m(-0.01612)
     | > avg_log_mle:[92m -0.33888 [0m(-0.00176)
     | > avg_loss_dur:[92m 0.76701 [0m(-0.01436)


[4m[1m > EPOCH: 867/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:00:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00801)
     | > avg_loss:[91m 0.46459 [0m(+0.03646)
     | > avg_log_mle:[91m -0.33031 [0m(+0.00858)
     | > avg_loss_dur:[91m 0.79490 [0m(+0.02789)


[4m[1m > EPOCH: 868/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:00:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 15625[0m
     | > loss: -0.72925  (-0.72925)
     | > log_mle: -0.79753  (-0.79753)
     | > loss_dur: 0.06828  (0.06828)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.86438  (18.86438)
     | > current_lr: 0.00022 
     | > step_time: 0.65860  (0.65860)
     | > loader_time: 0.35730  (0.35732)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[91m 0.50073 [0m(+0.03614)
     | > avg_log_mle:[91m -0.32267 [0m(+0.00764)
     | > avg_loss_dur:[91m 0.82340 [0m(+0.02850)


[4m[1m > EPOCH: 869/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:01:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 15650[0m
     | > loss: -0.59030  (-0.65358)
     | > log_mle: -0.68984  (-0.73558)
     | > loss_dur: 0.09954  (0.08201)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 26.42424  (14.18125)
     | > current_lr: 0.00022 
     | > step_time: 0.67960  (0.66823)
     | > loader_time: 0.40040  (0.41087)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[92m 0.49101 [0m(-0.00972)
     | > avg_log_mle:[92m -0.33075 [0m(-0.00809)
     | > avg_loss_dur:[92m 0.82176 [0m(-0.00163)


[4m[1m > EPOCH: 870/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:01:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 15675[0m
     | > loss: -0.52799  (-0.60524)
     | > log_mle: -0.62797  (-0.69576)
     | > loss_dur: 0.09999  (0.09052)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.23297  (11.86052)
     | > current_lr: 0.00022 
     | > step_time: 0.87780  (0.75122)
     | > loader_time: 0.55850  (0.48417)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[92m 0.45570 [0m(-0.03532)
     | > avg_log_mle:[92m -0.34691 [0m(-0.01616)
     | > avg_loss_dur:[92m 0.80261 [0m(-0.01915)


[4m[1m > EPOCH: 871/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:02:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00300)
     | > avg_loss:[91m 0.50608 [0m(+0.05038)
     | > avg_log_mle:[91m -0.33787 [0m(+0.00904)
     | > avg_loss_dur:[91m 0.84395 [0m(+0.04134)


[4m[1m > EPOCH: 872/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:02:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 15700[0m
     | > loss: -0.67344  (-0.70488)
     | > log_mle: -0.74688  (-0.77603)
     | > loss_dur: 0.07345  (0.07115)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.22862  (14.43762)
     | > current_lr: 0.00022 
     | > step_time: 0.73670  (0.65835)
     | > loader_time: 0.50050  (0.41688)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00701)
     | > avg_loss:[91m 0.52102 [0m(+0.01494)
     | > avg_log_mle:[91m -0.32521 [0m(+0.01266)
     | > avg_loss_dur:[91m 0.84623 [0m(+0.00228)


[4m[1m > EPOCH: 873/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:03:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 15725[0m
     | > loss: -0.58113  (-0.64468)
     | > log_mle: -0.68114  (-0.73015)
     | > loss_dur: 0.10001  (0.08548)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.03575  (20.47659)
     | > current_lr: 0.00022 
     | > step_time: 0.73970  (0.69627)
     | > loader_time: 0.47440  (0.44477)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[92m 0.45104 [0m(-0.06997)
     | > avg_log_mle:[92m -0.32735 [0m(-0.00213)
     | > avg_loss_dur:[92m 0.77839 [0m(-0.06784)


[4m[1m > EPOCH: 874/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:03:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00600)
     | > avg_loss:[91m 0.50193 [0m(+0.05089)
     | > avg_log_mle:[92m -0.32769 [0m(-0.00035)
     | > avg_loss_dur:[91m 0.82963 [0m(+0.05124)


[4m[1m > EPOCH: 875/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:04:24) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 15750[0m
     | > loss: -0.74485  (-0.74485)
     | > log_mle: -0.80336  (-0.80336)
     | > loss_dur: 0.05850  (0.05850)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.55868  (20.55868)
     | > current_lr: 0.00022 
     | > step_time: 0.50050  (0.50046)
     | > loader_time: 0.27630  (0.27625)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00601)
     | > avg_loss:[92m 0.46658 [0m(-0.03535)
     | > avg_log_mle:[92m -0.33058 [0m(-0.00288)
     | > avg_loss_dur:[92m 0.79716 [0m(-0.03247)


[4m[1m > EPOCH: 876/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:04:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 15775[0m
     | > loss: -0.65518  (-0.69119)
     | > log_mle: -0.73506  (-0.76377)
     | > loss_dur: 0.07989  (0.07258)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.40322  (13.91427)
     | > current_lr: 0.00022 
     | > step_time: 0.65060  (0.66661)
     | > loader_time: 0.42840  (0.41638)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00501)
     | > avg_loss:[92m 0.46197 [0m(-0.00462)
     | > avg_log_mle:[92m -0.33482 [0m(-0.00424)
     | > avg_loss_dur:[92m 0.79679 [0m(-0.00037)


[4m[1m > EPOCH: 877/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:05:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 15800[0m
     | > loss: -0.57034  (-0.63697)
     | > log_mle: -0.66236  (-0.72237)
     | > loss_dur: 0.09202  (0.08540)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.47089  (14.50571)
     | > current_lr: 0.00022 
     | > step_time: 1.02490  (0.74425)
     | > loader_time: 0.65260  (0.47393)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[91m 0.49364 [0m(+0.03167)
     | > avg_log_mle:[91m -0.32847 [0m(+0.00635)
     | > avg_loss_dur:[91m 0.82211 [0m(+0.02532)


[4m[1m > EPOCH: 878/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:05:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00300)
     | > avg_loss:[92m 0.47748 [0m(-0.01616)
     | > avg_log_mle:[92m -0.33613 [0m(-0.00766)
     | > avg_loss_dur:[92m 0.81361 [0m(-0.00850)


[4m[1m > EPOCH: 879/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:06:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 15825[0m
     | > loss: -0.70437  (-0.71990)
     | > log_mle: -0.77944  (-0.78941)
     | > loss_dur: 0.07507  (0.06951)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.76214  (10.73210)
     | > current_lr: 0.00022 
     | > step_time: 0.69160  (0.63725)
     | > loader_time: 0.45240  (0.40303)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00701)
     | > avg_loss:[91m 0.53450 [0m(+0.05702)
     | > avg_log_mle:[91m -0.32705 [0m(+0.00907)
     | > avg_loss_dur:[91m 0.86155 [0m(+0.04795)


[4m[1m > EPOCH: 880/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:07:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 15850[0m
     | > loss: -0.61648  (-0.65459)
     | > log_mle: -0.70038  (-0.73608)
     | > loss_dur: 0.08390  (0.08149)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.48788  (22.96488)
     | > current_lr: 0.00022 
     | > step_time: 0.69960  (0.69263)
     | > loader_time: 0.44240  (0.46522)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.01301)
     | > avg_loss:[92m 0.47849 [0m(-0.05601)
     | > avg_log_mle:[92m -0.33481 [0m(-0.00776)
     | > avg_loss_dur:[92m 0.81330 [0m(-0.04826)


[4m[1m > EPOCH: 881/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:07:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 15875[0m
     | > loss: -0.56030  (-0.60775)
     | > log_mle: -0.64840  (-0.69698)
     | > loss_dur: 0.08810  (0.08923)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.75526  (14.39655)
     | > current_lr: 0.00022 
     | > step_time: 0.85880  (0.77253)
     | > loader_time: 0.46240  (0.49080)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.00400)
     | > avg_loss:[91m 0.48351 [0m(+0.00502)
     | > avg_log_mle:[91m -0.32972 [0m(+0.00509)
     | > avg_loss_dur:[92m 0.81323 [0m(-0.00007)


[4m[1m > EPOCH: 882/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:08:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07407 [0m(-0.00100)
     | > avg_loss:[92m 0.45892 [0m(-0.02459)
     | > avg_log_mle:[92m -0.33142 [0m(-0.00170)
     | > avg_loss_dur:[92m 0.79034 [0m(-0.02289)


[4m[1m > EPOCH: 883/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:08:36) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 15900[0m
     | > loss: -0.61346  (-0.67388)
     | > log_mle: -0.70814  (-0.75426)
     | > loss_dur: 0.09467  (0.08038)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.14764  (20.97292)
     | > current_lr: 0.00022 
     | > step_time: 0.63760  (0.66994)
     | > loader_time: 0.39340  (0.41037)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00801)
     | > avg_loss:[91m 0.50443 [0m(+0.04550)
     | > avg_log_mle:[91m -0.32792 [0m(+0.00350)
     | > avg_loss_dur:[91m 0.83234 [0m(+0.04200)


[4m[1m > EPOCH: 884/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:09:07) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 15925[0m
     | > loss: -0.55389  (-0.64334)
     | > log_mle: -0.65047  (-0.72627)
     | > loss_dur: 0.09657  (0.08294)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.58749  (16.88134)
     | > current_lr: 0.00022 
     | > step_time: 0.78670  (0.72135)
     | > loader_time: 0.54050  (0.46881)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.01101)
     | > avg_loss:[92m 0.49044 [0m(-0.01398)
     | > avg_log_mle:[91m -0.32237 [0m(+0.00555)
     | > avg_loss_dur:[92m 0.81281 [0m(-0.01954)


[4m[1m > EPOCH: 885/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:09:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.01001)
     | > avg_loss:[92m 0.46408 [0m(-0.02636)
     | > avg_log_mle:[92m -0.33126 [0m(-0.00889)
     | > avg_loss_dur:[92m 0.79534 [0m(-0.01747)


[4m[1m > EPOCH: 886/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:10:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 15950[0m
     | > loss: -0.70508  (-0.72461)
     | > log_mle: -0.77539  (-0.79032)
     | > loss_dur: 0.07031  (0.06571)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.81234  (13.43363)
     | > current_lr: 0.00022 
     | > step_time: 0.56450  (0.60855)
     | > loader_time: 0.35430  (0.36333)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00701)
     | > avg_loss:[92m 0.45882 [0m(-0.00526)
     | > avg_log_mle:[91m -0.32450 [0m(+0.00675)
     | > avg_loss_dur:[92m 0.78333 [0m(-0.01201)


[4m[1m > EPOCH: 887/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:10:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 15975[0m
     | > loss: -0.64577  (-0.65439)
     | > log_mle: -0.73396  (-0.73558)
     | > loss_dur: 0.08819  (0.08119)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.56525  (17.23002)
     | > current_lr: 0.00022 
     | > step_time: 0.86880  (0.69041)
     | > loader_time: 0.55650  (0.46420)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00300)
     | > avg_loss:[91m 0.49760 [0m(+0.03878)
     | > avg_log_mle:[91m -0.31543 [0m(+0.00907)
     | > avg_loss_dur:[91m 0.81303 [0m(+0.02971)


[4m[1m > EPOCH: 888/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:11:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 16000[0m
     | > loss: -0.54648  (-0.61559)
     | > log_mle: -0.63694  (-0.70119)
     | > loss_dur: 0.09046  (0.08560)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.06877  (13.95194)
     | > current_lr: 0.00022 
     | > step_time: 0.95690  (0.76395)
     | > loader_time: 0.62560  (0.49320)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08007 [0m(+0.00901)
     | > avg_loss:[92m 0.49041 [0m(-0.00719)
     | > avg_log_mle:[92m -0.32168 [0m(-0.00624)
     | > avg_loss_dur:[92m 0.81209 [0m(-0.00095)


[4m[1m > EPOCH: 889/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:11:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00901)
     | > avg_loss:[92m 0.48078 [0m(-0.00963)
     | > avg_log_mle:[92m -0.32523 [0m(-0.00355)
     | > avg_loss_dur:[92m 0.80600 [0m(-0.00608)


[4m[1m > EPOCH: 890/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:12:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 16025[0m
     | > loss: -0.61795  (-0.68792)
     | > log_mle: -0.70907  (-0.76491)
     | > loss_dur: 0.09112  (0.07699)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.13624  (16.02973)
     | > current_lr: 0.00022 
     | > step_time: 0.74170  (0.68122)
     | > loader_time: 0.44940  (0.41177)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[92m 0.45771 [0m(-0.02307)
     | > avg_log_mle:[91m -0.30404 [0m(+0.02119)
     | > avg_loss_dur:[92m 0.76175 [0m(-0.04425)


[4m[1m > EPOCH: 891/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:12:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 16050[0m
     | > loss: -0.58246  (-0.64739)
     | > log_mle: -0.67768  (-0.73035)
     | > loss_dur: 0.09522  (0.08296)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.23308  (10.92929)
     | > current_lr: 0.00022 
     | > step_time: 0.91680  (0.71398)
     | > loader_time: 0.69960  (0.46309)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00300)
     | > avg_loss:[91m 0.48347 [0m(+0.02576)
     | > avg_log_mle:[92m -0.32009 [0m(-0.01604)
     | > avg_loss_dur:[91m 0.80356 [0m(+0.04181)


[4m[1m > EPOCH: 892/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:13:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00100)
     | > avg_loss:[91m 0.50711 [0m(+0.02364)
     | > avg_log_mle:[92m -0.32172 [0m(-0.00163)
     | > avg_loss_dur:[91m 0.82883 [0m(+0.02527)


[4m[1m > EPOCH: 893/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:13:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 16075[0m
     | > loss: -0.74826  (-0.74826)
     | > log_mle: -0.81196  (-0.81196)
     | > loss_dur: 0.06370  (0.06370)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.10049  (16.10049)
     | > current_lr: 0.00022 
     | > step_time: 0.65160  (0.65159)
     | > loader_time: 0.39340  (0.39336)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[92m 0.46978 [0m(-0.03733)
     | > avg_log_mle:[91m -0.31687 [0m(+0.00484)
     | > avg_loss_dur:[92m 0.78666 [0m(-0.04217)


[4m[1m > EPOCH: 894/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:14:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 16100[0m
     | > loss: -0.59806  (-0.65342)
     | > log_mle: -0.69995  (-0.73632)
     | > loss_dur: 0.10189  (0.08290)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.25919  (21.65272)
     | > current_lr: 0.00022 
     | > step_time: 0.67960  (0.66761)
     | > loader_time: 0.38640  (0.42113)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[91m 0.47116 [0m(+0.00138)
     | > avg_log_mle:[92m -0.32001 [0m(-0.00314)
     | > avg_loss_dur:[91m 0.79117 [0m(+0.00452)


[4m[1m > EPOCH: 895/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:14:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 16125[0m
     | > loss: -0.56626  (-0.63268)
     | > log_mle: -0.65988  (-0.71724)
     | > loss_dur: 0.09363  (0.08456)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.97642  (19.18474)
     | > current_lr: 0.00022 
     | > step_time: 0.87480  (0.75135)
     | > loader_time: 0.52950  (0.47029)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00200)
     | > avg_loss:[91m 0.52089 [0m(+0.04973)
     | > avg_log_mle:[91m -0.31780 [0m(+0.00221)
     | > avg_loss_dur:[91m 0.83869 [0m(+0.04752)


[4m[1m > EPOCH: 896/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:15:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00501)
     | > avg_loss:[91m 0.55088 [0m(+0.02999)
     | > avg_log_mle:[91m -0.30432 [0m(+0.01348)
     | > avg_loss_dur:[91m 0.85520 [0m(+0.01651)


[4m[1m > EPOCH: 897/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:15:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 16150[0m
     | > loss: -0.65602  (-0.71624)
     | > log_mle: -0.73797  (-0.78534)
     | > loss_dur: 0.08194  (0.06910)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.71099  (12.78245)
     | > current_lr: 0.00022 
     | > step_time: 0.73070  (0.65785)
     | > loader_time: 0.50050  (0.40937)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00000)
     | > avg_loss:[92m 0.51931 [0m(-0.03157)
     | > avg_log_mle:[92m -0.31228 [0m(-0.00796)
     | > avg_loss_dur:[92m 0.83159 [0m(-0.02361)


[4m[1m > EPOCH: 898/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:16:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 16175[0m
     | > loss: -0.64429  (-0.67050)
     | > log_mle: -0.72808  (-0.74751)
     | > loss_dur: 0.08379  (0.07702)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.65685  (14.66362)
     | > current_lr: 0.00022 
     | > step_time: 0.73870  (0.69554)
     | > loader_time: 0.44540  (0.43467)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00100)
     | > avg_loss:[92m 0.51144 [0m(-0.00787)
     | > avg_log_mle:[91m -0.31151 [0m(+0.00077)
     | > avg_loss_dur:[92m 0.82295 [0m(-0.00864)


[4m[1m > EPOCH: 899/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:16:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[92m 0.42385 [0m(-0.08759)
     | > avg_log_mle:[91m -0.31127 [0m(+0.00024)
     | > avg_loss_dur:[92m 0.73512 [0m(-0.08783)


[4m[1m > EPOCH: 900/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:17:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 16200[0m
     | > loss: -0.77295  (-0.77295)
     | > log_mle: -0.82798  (-0.82798)
     | > loss_dur: 0.05503  (0.05503)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 25.03582  (25.03582)
     | > current_lr: 0.00022 
     | > step_time: 0.67160  (0.67161)
     | > loader_time: 0.26920  (0.26923)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00601)
     | > avg_loss:[91m 0.43791 [0m(+0.01406)
     | > avg_log_mle:[92m -0.31718 [0m(-0.00591)
     | > avg_loss_dur:[91m 0.75509 [0m(+0.01998)


[4m[1m > EPOCH: 901/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:18:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 16225[0m
     | > loss: -0.61377  (-0.68326)
     | > log_mle: -0.70915  (-0.75992)
     | > loss_dur: 0.09538  (0.07666)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.27888  (9.00313)
     | > current_lr: 0.00023 
     | > step_time: 0.65160  (0.66604)
     | > loader_time: 0.37030  (0.40966)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00100)
     | > avg_loss:[91m 0.53157 [0m(+0.09366)
     | > avg_log_mle:[91m -0.31649 [0m(+0.00069)
     | > avg_loss_dur:[91m 0.84806 [0m(+0.09297)


[4m[1m > EPOCH: 902/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:18:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 16250[0m
     | > loss: -0.57739  (-0.63840)
     | > log_mle: -0.66454  (-0.72160)
     | > loss_dur: 0.08714  (0.08320)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.12916  (14.88515)
     | > current_lr: 0.00023 
     | > step_time: 1.01690  (0.74046)
     | > loader_time: 0.68260  (0.48601)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06306 [0m(-0.00601)
     | > avg_loss:[92m 0.48389 [0m(-0.04769)
     | > avg_log_mle:[91m -0.31441 [0m(+0.00208)
     | > avg_loss_dur:[92m 0.79830 [0m(-0.04977)


[4m[1m > EPOCH: 903/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:19:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00801)
     | > avg_loss:[91m 0.50713 [0m(+0.02324)
     | > avg_log_mle:[92m -0.31813 [0m(-0.00372)
     | > avg_loss_dur:[91m 0.82526 [0m(+0.02696)


[4m[1m > EPOCH: 904/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:19:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 16275[0m
     | > loss: -0.68302  (-0.72232)
     | > log_mle: -0.77013  (-0.79580)
     | > loss_dur: 0.08711  (0.07348)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.94942  (9.64130)
     | > current_lr: 0.00023 
     | > step_time: 0.69060  (0.63525)
     | > loader_time: 0.39340  (0.37768)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00100)
     | > avg_loss:[92m 0.46250 [0m(-0.04462)
     | > avg_log_mle:[92m -0.32501 [0m(-0.00688)
     | > avg_loss_dur:[92m 0.78751 [0m(-0.03775)


[4m[1m > EPOCH: 905/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:20:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 16300[0m
     | > loss: -0.61662  (-0.67109)
     | > log_mle: -0.70969  (-0.75329)
     | > loss_dur: 0.09307  (0.08220)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 19.98818  (10.23958)
     | > current_lr: 0.00023 
     | > step_time: 0.72270  (0.69403)
     | > loader_time: 0.46140  (0.44180)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00400)
     | > avg_loss:[91m 0.50099 [0m(+0.03849)
     | > avg_log_mle:[91m -0.28403 [0m(+0.04098)
     | > avg_loss_dur:[92m 0.78502 [0m(-0.00249)


[4m[1m > EPOCH: 906/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:20:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 16325[0m
     | > loss: -0.56621  (-0.61789)
     | > log_mle: -0.65287  (-0.70689)
     | > loss_dur: 0.08666  (0.08900)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 5.48889  (10.02853)
     | > current_lr: 0.00023 
     | > step_time: 0.84780  (0.76853)
     | > loader_time: 0.47840  (0.48909)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00100)
     | > avg_loss:[92m 0.45693 [0m(-0.04406)
     | > avg_log_mle:[92m -0.32579 [0m(-0.04176)
     | > avg_loss_dur:[92m 0.78272 [0m(-0.00230)


[4m[1m > EPOCH: 907/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:21:10) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06506 [0m(+0.00000)
     | > avg_loss:[92m 0.42082 [0m(-0.03611)
     | > avg_log_mle:[91m -0.31778 [0m(+0.00801)
     | > avg_loss_dur:[92m 0.73860 [0m(-0.04412)


[4m[1m > EPOCH: 908/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:21:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 16350[0m
     | > loss: -0.60284  (-0.67949)
     | > log_mle: -0.69833  (-0.76102)
     | > loss_dur: 0.09549  (0.08154)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.08019  (19.76346)
     | > current_lr: 0.00023 
     | > step_time: 0.64160  (0.67144)
     | > loader_time: 0.38740  (0.41755)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.01001)
     | > avg_loss:[91m 0.47076 [0m(+0.04994)
     | > avg_log_mle:[92m -0.31806 [0m(-0.00028)
     | > avg_loss_dur:[91m 0.78882 [0m(+0.05022)


[4m[1m > EPOCH: 909/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:22:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 16375[0m
     | > loss: -0.54378  (-0.65432)
     | > log_mle: -0.64477  (-0.73535)
     | > loss_dur: 0.10099  (0.08103)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.48143  (14.87171)
     | > current_lr: 0.00023 
     | > step_time: 0.78570  (0.71950)
     | > loader_time: 0.47840  (0.46204)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00300)
     | > avg_loss:[91m 0.47821 [0m(+0.00745)
     | > avg_log_mle:[91m -0.29520 [0m(+0.02286)
     | > avg_loss_dur:[92m 0.77341 [0m(-0.01541)


[4m[1m > EPOCH: 910/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:22:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00300)
     | > avg_loss:[91m 0.49612 [0m(+0.01790)
     | > avg_log_mle:[92m -0.31736 [0m(-0.02217)
     | > avg_loss_dur:[91m 0.81348 [0m(+0.04007)


[4m[1m > EPOCH: 911/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:23:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 16400[0m
     | > loss: -0.75760  (-0.76027)
     | > log_mle: -0.82122  (-0.82389)
     | > loss_dur: 0.06362  (0.06362)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.81281  (6.47108)
     | > current_lr: 0.00023 
     | > step_time: 0.55350  (0.60305)
     | > loader_time: 0.32730  (0.35082)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00000)
     | > avg_loss:[92m 0.46928 [0m(-0.02683)
     | > avg_log_mle:[91m -0.31140 [0m(+0.00597)
     | > avg_loss_dur:[92m 0.78068 [0m(-0.03280)


[4m[1m > EPOCH: 912/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:23:49) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 16425[0m
     | > loss: -0.66577  (-0.68404)
     | > log_mle: -0.74644  (-0.76062)
     | > loss_dur: 0.08067  (0.07658)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.50835  (20.30971)
     | > current_lr: 0.00023 
     | > step_time: 0.87480  (0.69341)
     | > loader_time: 0.59450  (0.43339)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00400)
     | > avg_loss:[92m 0.46840 [0m(-0.00089)
     | > avg_log_mle:[91m -0.31003 [0m(+0.00137)
     | > avg_loss_dur:[92m 0.77842 [0m(-0.00226)


[4m[1m > EPOCH: 913/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:24:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 16450[0m
     | > loss: -0.54680  (-0.64184)
     | > log_mle: -0.64191  (-0.72296)
     | > loss_dur: 0.09511  (0.08113)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.74569  (17.23201)
     | > current_lr: 0.00023 
     | > step_time: 0.95790  (0.76507)
     | > loader_time: 0.62160  (0.49038)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08207 [0m(+0.00901)
     | > avg_loss:[91m 0.51419 [0m(+0.04579)
     | > avg_log_mle:[91m -0.30075 [0m(+0.00928)
     | > avg_loss_dur:[91m 0.81493 [0m(+0.03651)


[4m[1m > EPOCH: 914/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:24:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.01001)
     | > avg_loss:[92m 0.48751 [0m(-0.02668)
     | > avg_log_mle:[91m -0.30060 [0m(+0.00015)
     | > avg_loss_dur:[92m 0.78811 [0m(-0.02683)


[4m[1m > EPOCH: 915/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:25:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 16475[0m
     | > loss: -0.64504  (-0.71271)
     | > log_mle: -0.72868  (-0.78508)
     | > loss_dur: 0.08364  (0.07237)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 7.10735  (8.34311)
     | > current_lr: 0.00023 
     | > step_time: 0.74470  (0.67542)
     | > loader_time: 0.44040  (0.41177)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08107 [0m(+0.00901)
     | > avg_loss:[92m 0.48258 [0m(-0.00493)
     | > avg_log_mle:[92m -0.30229 [0m(-0.00170)
     | > avg_loss_dur:[92m 0.78488 [0m(-0.00323)


[4m[1m > EPOCH: 916/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:25:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 16500[0m
     | > loss: -0.58864  (-0.66817)
     | > log_mle: -0.68045  (-0.74840)
     | > loss_dur: 0.09181  (0.08023)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.64202  (11.68333)
     | > current_lr: 0.00023 
     | > step_time: 0.90880  (0.71373)
     | > loader_time: 0.63160  (0.46717)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.01301)
     | > avg_loss:[92m 0.43469 [0m(-0.04790)
     | > avg_log_mle:[92m -0.31725 [0m(-0.01496)
     | > avg_loss_dur:[92m 0.75194 [0m(-0.03294)


[4m[1m > EPOCH: 917/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:26:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[92m 0.43303 [0m(-0.00166)
     | > avg_log_mle:[91m -0.31108 [0m(+0.00617)
     | > avg_loss_dur:[92m 0.74411 [0m(-0.00783)


[4m[1m > EPOCH: 918/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:26:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 16525[0m
     | > loss: -0.78309  (-0.78309)
     | > log_mle: -0.84032  (-0.84032)
     | > loss_dur: 0.05723  (0.05723)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.35468  (9.35468)
     | > current_lr: 0.00023 
     | > step_time: 0.65260  (0.65260)
     | > loader_time: 0.36730  (0.36733)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00100)
     | > avg_loss:[91m 0.48764 [0m(+0.05462)
     | > avg_log_mle:[91m -0.29772 [0m(+0.01336)
     | > avg_loss_dur:[91m 0.78536 [0m(+0.04126)


[4m[1m > EPOCH: 919/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:27:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 16550[0m
     | > loss: -0.60100  (-0.68058)
     | > log_mle: -0.69387  (-0.75776)
     | > loss_dur: 0.09288  (0.07717)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 60.07213  (44.83760)
     | > current_lr: 0.00023 
     | > step_time: 0.68060  (0.66823)
     | > loader_time: 0.45440  (0.42101)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07106 [0m(+0.00000)
     | > avg_loss:[91m 0.49523 [0m(+0.00759)
     | > avg_log_mle:[92m -0.30694 [0m(-0.00922)
     | > avg_loss_dur:[91m 0.80217 [0m(+0.01680)


[4m[1m > EPOCH: 920/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:27:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 16575[0m
     | > loss: -0.54961  (-0.64871)
     | > log_mle: -0.64294  (-0.73094)
     | > loss_dur: 0.09334  (0.08223)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.40644  (14.13131)
     | > current_lr: 0.00023 
     | > step_time: 0.87280  (0.75015)
     | > loader_time: 0.52650  (0.47216)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00300)
     | > avg_loss:[92m 0.44828 [0m(-0.04695)
     | > avg_log_mle:[91m -0.29751 [0m(+0.00943)
     | > avg_loss_dur:[92m 0.74579 [0m(-0.05638)


[4m[1m > EPOCH: 921/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:28:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00200)
     | > avg_loss:[91m 0.52631 [0m(+0.07803)
     | > avg_log_mle:[91m -0.29429 [0m(+0.00323)
     | > avg_loss_dur:[91m 0.82059 [0m(+0.07480)


[4m[1m > EPOCH: 922/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:29:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 16600[0m
     | > loss: -0.70268  (-0.71931)
     | > log_mle: -0.77408  (-0.79540)
     | > loss_dur: 0.07140  (0.07609)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.39499  (12.33017)
     | > current_lr: 0.00023 
     | > step_time: 0.73070  (0.65835)
     | > loader_time: 0.51450  (0.42739)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[92m 0.49107 [0m(-0.03523)
     | > avg_log_mle:[92m -0.30759 [0m(-0.01330)
     | > avg_loss_dur:[92m 0.79866 [0m(-0.02193)


[4m[1m > EPOCH: 923/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:29:31) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 16625[0m
     | > loss: -0.61258  (-0.67659)
     | > log_mle: -0.70269  (-0.75778)
     | > loss_dur: 0.09011  (0.08119)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 37.67990  (16.34547)
     | > current_lr: 0.00023 
     | > step_time: 0.74370  (0.69736)
     | > loader_time: 0.46140  (0.43894)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00801)
     | > avg_loss:[91m 0.57279 [0m(+0.08171)
     | > avg_log_mle:[91m -0.28849 [0m(+0.01910)
     | > avg_loss_dur:[91m 0.86127 [0m(+0.06261)


[4m[1m > EPOCH: 924/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:30:02) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.08007 [0m(+0.01501)
     | > avg_loss:[92m 0.51631 [0m(-0.05647)
     | > avg_log_mle:[92m -0.29894 [0m(-0.01045)
     | > avg_loss_dur:[92m 0.81525 [0m(-0.04602)


[4m[1m > EPOCH: 925/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:30:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 16650[0m
     | > loss: -0.77598  (-0.77598)
     | > log_mle: -0.83690  (-0.83690)
     | > loss_dur: 0.06093  (0.06093)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.70629  (13.70629)
     | > current_lr: 0.00023 
     | > step_time: 0.50050  (0.50045)
     | > loader_time: 0.29230  (0.29227)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.01001)
     | > avg_loss:[91m 0.52668 [0m(+0.01037)
     | > avg_log_mle:[92m -0.30384 [0m(-0.00490)
     | > avg_loss_dur:[91m 0.83052 [0m(+0.01527)


[4m[1m > EPOCH: 926/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:31:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 16675[0m
     | > loss: -0.66801  (-0.70816)
     | > log_mle: -0.74730  (-0.78105)
     | > loss_dur: 0.07929  (0.07289)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.12957  (13.35792)
     | > current_lr: 0.00023 
     | > step_time: 0.64960  (0.66618)
     | > loader_time: 0.39840  (0.41166)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00200)
     | > avg_loss:[91m 0.56758 [0m(+0.04090)
     | > avg_log_mle:[91m -0.29009 [0m(+0.01375)
     | > avg_loss_dur:[91m 0.85768 [0m(+0.02715)


[4m[1m > EPOCH: 927/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:31:34) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 16700[0m
     | > loss: -0.53303  (-0.66016)
     | > log_mle: -0.63833  (-0.73885)
     | > loss_dur: 0.10531  (0.07869)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.59538  (22.53086)
     | > current_lr: 0.00023 
     | > step_time: 1.01890  (0.74218)
     | > loader_time: 0.67460  (0.49238)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00100)
     | > avg_loss:[92m 0.51245 [0m(-0.05513)
     | > avg_log_mle:[92m -0.29409 [0m(-0.00400)
     | > avg_loss_dur:[92m 0.80654 [0m(-0.05114)


[4m[1m > EPOCH: 928/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:32:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00000)
     | > avg_loss:[91m 0.52279 [0m(+0.01034)
     | > avg_log_mle:[92m -0.31285 [0m(-0.01877)
     | > avg_loss_dur:[91m 0.83565 [0m(+0.02911)


[4m[1m > EPOCH: 929/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:32:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 16725[0m
     | > loss: -0.73662  (-0.75166)
     | > log_mle: -0.80610  (-0.81663)
     | > loss_dur: 0.06948  (0.06498)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.21275  (10.70382)
     | > current_lr: 0.00023 
     | > step_time: 0.68760  (0.63291)
     | > loader_time: 0.41140  (0.37601)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06005 [0m(-0.00701)
     | > avg_loss:[92m 0.49985 [0m(-0.02294)
     | > avg_log_mle:[91m -0.30292 [0m(+0.00993)
     | > avg_loss_dur:[92m 0.80277 [0m(-0.03287)


[4m[1m > EPOCH: 930/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:33:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 16750[0m
     | > loss: -0.63650  (-0.68896)
     | > log_mle: -0.71754  (-0.76376)
     | > loss_dur: 0.08104  (0.07480)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.39041  (15.12983)
     | > current_lr: 0.00023 
     | > step_time: 0.70360  (0.69113)
     | > loader_time: 0.47440  (0.42929)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00901)
     | > avg_loss:[91m 0.50722 [0m(+0.00737)
     | > avg_log_mle:[91m -0.29966 [0m(+0.00327)
     | > avg_loss_dur:[91m 0.80688 [0m(+0.00411)


[4m[1m > EPOCH: 931/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:33:39) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 16775[0m
     | > loss: -0.56364  (-0.63986)
     | > log_mle: -0.64700  (-0.72207)
     | > loss_dur: 0.08336  (0.08221)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 13.40950  (21.55722)
     | > current_lr: 0.00023 
     | > step_time: 0.84580  (0.77041)
     | > loader_time: 0.46640  (0.49904)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00500)
     | > avg_loss:[91m 0.52107 [0m(+0.01385)
     | > avg_log_mle:[92m -0.30445 [0m(-0.00480)
     | > avg_loss_dur:[91m 0.82552 [0m(+0.01864)


[4m[1m > EPOCH: 932/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:34:12) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00300)
     | > avg_loss:[92m 0.51647 [0m(-0.00460)
     | > avg_log_mle:[91m -0.28570 [0m(+0.01875)
     | > avg_loss_dur:[92m 0.80218 [0m(-0.02334)


[4m[1m > EPOCH: 933/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:34:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 16800[0m
     | > loss: -0.60171  (-0.69153)
     | > log_mle: -0.68963  (-0.76635)
     | > loss_dur: 0.08793  (0.07481)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.54491  (10.17136)
     | > current_lr: 0.00023 
     | > step_time: 0.63660  (0.66894)
     | > loader_time: 0.38740  (0.41838)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00200)
     | > avg_loss:[92m 0.48954 [0m(-0.02694)
     | > avg_log_mle:[92m -0.30902 [0m(-0.02332)
     | > avg_loss_dur:[92m 0.79856 [0m(-0.00362)


[4m[1m > EPOCH: 934/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:35:13) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 16825[0m
     | > loss: -0.56050  (-0.65479)
     | > log_mle: -0.65824  (-0.74069)
     | > loss_dur: 0.09774  (0.08591)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.17302  (18.10523)
     | > current_lr: 0.00023 
     | > step_time: 0.78970  (0.72374)
     | > loader_time: 0.47340  (0.45064)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00500)
     | > avg_loss:[92m 0.44402 [0m(-0.04551)
     | > avg_log_mle:[91m -0.30494 [0m(+0.00408)
     | > avg_loss_dur:[92m 0.74896 [0m(-0.04960)


[4m[1m > EPOCH: 935/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:35:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07907 [0m(+0.01101)
     | > avg_loss:[91m 0.46995 [0m(+0.02593)
     | > avg_log_mle:[91m -0.29320 [0m(+0.01174)
     | > avg_loss_dur:[91m 0.76315 [0m(+0.01418)


[4m[1m > EPOCH: 936/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:36:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 16850[0m
     | > loss: -0.77294  (-0.78187)
     | > log_mle: -0.83581  (-0.84384)
     | > loss_dur: 0.06287  (0.06197)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 10.92102  (16.89307)
     | > current_lr: 0.00023 
     | > step_time: 0.56550  (0.61006)
     | > loader_time: 0.36230  (0.36533)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00701)
     | > avg_loss:[92m 0.46704 [0m(-0.00291)
     | > avg_log_mle:[92m -0.29760 [0m(-0.00440)
     | > avg_loss_dur:[91m 0.76464 [0m(+0.00150)


[4m[1m > EPOCH: 937/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:36:46) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 16875[0m
     | > loss: -0.64252  (-0.68853)
     | > log_mle: -0.72269  (-0.76386)
     | > loss_dur: 0.08016  (0.07533)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 3.98382  (8.30065)
     | > current_lr: 0.00023 
     | > step_time: 0.87380  (0.69141)
     | > loader_time: 0.61160  (0.43362)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07507 [0m(+0.00300)
     | > avg_loss:[92m 0.45965 [0m(-0.00739)
     | > avg_log_mle:[91m -0.27611 [0m(+0.02149)
     | > avg_loss_dur:[92m 0.73576 [0m(-0.02889)


[4m[1m > EPOCH: 938/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:37:17) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 16900[0m
     | > loss: -0.54047  (-0.62306)
     | > log_mle: -0.63812  (-0.70976)
     | > loss_dur: 0.09765  (0.08669)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.49182  (11.42579)
     | > current_lr: 0.00023 
     | > step_time: 0.95290  (0.76413)
     | > loader_time: 0.61560  (0.47380)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00200)
     | > avg_loss:[91m 0.49322 [0m(+0.03357)
     | > avg_log_mle:[92m -0.29557 [0m(-0.01946)
     | > avg_loss_dur:[91m 0.78879 [0m(+0.05303)


[4m[1m > EPOCH: 939/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:37:48) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00400)
     | > avg_loss:[92m 0.45461 [0m(-0.03862)
     | > avg_log_mle:[92m -0.30264 [0m(-0.00707)
     | > avg_loss_dur:[92m 0.75724 [0m(-0.03155)


[4m[1m > EPOCH: 940/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:38:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 16925[0m
     | > loss: -0.65890  (-0.71559)
     | > log_mle: -0.74245  (-0.78471)
     | > loss_dur: 0.08355  (0.06912)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.50263  (12.20387)
     | > current_lr: 0.00023 
     | > step_time: 0.73970  (0.67521)
     | > loader_time: 0.43340  (0.44841)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07707 [0m(-0.00000)
     | > avg_loss:[91m 0.47201 [0m(+0.01741)
     | > avg_log_mle:[92m -0.30594 [0m(-0.00330)
     | > avg_loss_dur:[91m 0.77795 [0m(+0.02071)


[4m[1m > EPOCH: 941/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:38:51) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 16950[0m
     | > loss: -0.58948  (-0.67944)
     | > log_mle: -0.68557  (-0.75712)
     | > loss_dur: 0.09609  (0.07768)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.70638  (11.18899)
     | > current_lr: 0.00024 
     | > step_time: 0.91180  (0.71448)
     | > loader_time: 0.63960  (0.46092)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07507 [0m(-0.00200)
     | > avg_loss:[92m 0.46114 [0m(-0.01088)
     | > avg_log_mle:[92m -0.30603 [0m(-0.00009)
     | > avg_loss_dur:[92m 0.76716 [0m(-0.01079)


[4m[1m > EPOCH: 942/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:39:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07305 [0m(-0.00202)
     | > avg_loss:[92m 0.44662 [0m(-0.01452)
     | > avg_log_mle:[91m -0.29350 [0m(+0.01253)
     | > avg_loss_dur:[92m 0.74012 [0m(-0.02704)


[4m[1m > EPOCH: 943/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:39:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 16975[0m
     | > loss: -0.75412  (-0.75412)
     | > log_mle: -0.82091  (-0.82091)
     | > loss_dur: 0.06679  (0.06679)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 15.19804  (15.19804)
     | > current_lr: 0.00024 
     | > step_time: 0.65660  (0.65660)
     | > loader_time: 0.36430  (0.36433)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00099)
     | > avg_loss:[91m 0.50619 [0m(+0.05957)
     | > avg_log_mle:[92m -0.30400 [0m(-0.01051)
     | > avg_loss_dur:[91m 0.81020 [0m(+0.07008)


[4m[1m > EPOCH: 944/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:40:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 17000[0m
     | > loss: -0.61664  (-0.68513)
     | > log_mle: -0.71624  (-0.76549)
     | > loss_dur: 0.09960  (0.08036)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 23.86443  (24.11551)
     | > current_lr: 0.00024 
     | > step_time: 0.68060  (0.66636)
     | > loader_time: 0.41840  (0.42776)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00200)
     | > avg_loss:[91m 0.53459 [0m(+0.02840)
     | > avg_log_mle:[91m -0.27466 [0m(+0.02935)
     | > avg_loss_dur:[92m 0.80925 [0m(-0.00095)


[4m[1m > EPOCH: 945/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:40:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 17025[0m
     | > loss: -0.56371  (-0.64065)
     | > log_mle: -0.65367  (-0.72467)
     | > loss_dur: 0.08996  (0.08401)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.78274  (17.77419)
     | > current_lr: 0.00024 
     | > step_time: 0.88180  (0.75362)
     | > loader_time: 0.56750  (0.48097)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00701)
     | > avg_loss:[92m 0.52052 [0m(-0.01408)
     | > avg_log_mle:[92m -0.28602 [0m(-0.01136)
     | > avg_loss_dur:[92m 0.80654 [0m(-0.00271)


[4m[1m > EPOCH: 946/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:41:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00601)
     | > avg_loss:[91m 0.52968 [0m(+0.00916)
     | > avg_log_mle:[91m -0.28541 [0m(+0.00061)
     | > avg_loss_dur:[91m 0.81509 [0m(+0.00855)


[4m[1m > EPOCH: 947/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:41:55) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 17050[0m
     | > loss: -0.70256  (-0.74840)
     | > log_mle: -0.77344  (-0.81564)
     | > loss_dur: 0.07088  (0.06724)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 16.90914  (12.10261)
     | > current_lr: 0.00024 
     | > step_time: 0.73270  (0.65935)
     | > loader_time: 0.48540  (0.38760)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00500)
     | > avg_loss:[91m 0.53814 [0m(+0.00846)
     | > avg_log_mle:[92m -0.29404 [0m(-0.00862)
     | > avg_loss_dur:[91m 0.83217 [0m(+0.01708)


[4m[1m > EPOCH: 948/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:42:26) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 17075[0m
     | > loss: -0.62048  (-0.68441)
     | > log_mle: -0.70271  (-0.76054)
     | > loss_dur: 0.08224  (0.07613)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.36259  (12.14346)
     | > current_lr: 0.00024 
     | > step_time: 0.73870  (0.69572)
     | > loader_time: 0.44340  (0.44213)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[92m 0.45302 [0m(-0.08512)
     | > avg_log_mle:[92m -0.29784 [0m(-0.00381)
     | > avg_loss_dur:[92m 0.75086 [0m(-0.08131)


[4m[1m > EPOCH: 949/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:42:57) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[91m 0.51712 [0m(+0.06410)
     | > avg_log_mle:[91m -0.29070 [0m(+0.00714)
     | > avg_loss_dur:[91m 0.80782 [0m(+0.05695)


[4m[1m > EPOCH: 950/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:43:29) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 17100[0m
     | > loss: -0.78902  (-0.78902)
     | > log_mle: -0.84846  (-0.84846)
     | > loss_dur: 0.05944  (0.05944)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 22.65879  (22.65879)
     | > current_lr: 0.00024 
     | > step_time: 0.62360  (0.62357)
     | > loader_time: 0.27530  (0.27525)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07206 [0m(+0.00300)
     | > avg_loss:[92m 0.47584 [0m(-0.04128)
     | > avg_log_mle:[92m -0.29563 [0m(-0.00494)
     | > avg_loss_dur:[92m 0.77148 [0m(-0.03634)


[4m[1m > EPOCH: 951/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:43:59) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 17125[0m
     | > loss: -0.63035  (-0.69041)
     | > log_mle: -0.71853  (-0.76850)
     | > loss_dur: 0.08818  (0.07809)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 20.35356  (20.82917)
     | > current_lr: 0.00024 
     | > step_time: 0.64960  (0.66847)
     | > loader_time: 0.41140  (0.40608)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.51188 [0m(+0.03603)
     | > avg_log_mle:[91m -0.28485 [0m(+0.01078)
     | > avg_loss_dur:[91m 0.79672 [0m(+0.02525)


[4m[1m > EPOCH: 952/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:44:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 17150[0m
     | > loss: -0.56971  (-0.64925)
     | > log_mle: -0.66779  (-0.73380)
     | > loss_dur: 0.09808  (0.08455)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 8.40587  (13.88635)
     | > current_lr: 0.00024 
     | > step_time: 1.02390  (0.74325)
     | > loader_time: 0.61060  (0.46521)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00100)
     | > avg_loss:[92m 0.49874 [0m(-0.01313)
     | > avg_log_mle:[92m -0.28543 [0m(-0.00058)
     | > avg_loss_dur:[92m 0.78417 [0m(-0.01255)


[4m[1m > EPOCH: 953/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:45:01) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00000)
     | > avg_loss:[91m 0.50765 [0m(+0.00891)
     | > avg_log_mle:[92m -0.28545 [0m(-0.00002)
     | > avg_loss_dur:[91m 0.79310 [0m(+0.00893)


[4m[1m > EPOCH: 954/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:45:33) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 17175[0m
     | > loss: -0.76447  (-0.76769)
     | > log_mle: -0.82719  (-0.82928)
     | > loss_dur: 0.06272  (0.06159)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.52343  (16.02389)
     | > current_lr: 0.00024 
     | > step_time: 0.68560  (0.63658)
     | > loader_time: 0.42040  (0.38201)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00601)
     | > avg_loss:[92m 0.48106 [0m(-0.02660)
     | > avg_log_mle:[91m -0.27613 [0m(+0.00932)
     | > avg_loss_dur:[92m 0.75718 [0m(-0.03592)


[4m[1m > EPOCH: 955/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:46:04) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 17200[0m
     | > loss: -0.64416  (-0.69505)
     | > log_mle: -0.72373  (-0.76917)
     | > loss_dur: 0.07957  (0.07412)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 13.98944  (16.61464)
     | > current_lr: 0.00024 
     | > step_time: 0.70360  (0.69343)
     | > loader_time: 0.44240  (0.43609)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01201)
     | > avg_loss:[91m 0.49552 [0m(+0.01446)
     | > avg_log_mle:[92m -0.28037 [0m(-0.00425)
     | > avg_loss_dur:[91m 0.77589 [0m(+0.01871)


[4m[1m > EPOCH: 956/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:46:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 17225[0m
     | > loss: -0.59056  (-0.66080)
     | > log_mle: -0.66782  (-0.73935)
     | > loss_dur: 0.07726  (0.07856)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 26.83610  (17.11574)
     | > current_lr: 0.00024 
     | > step_time: 0.84780  (0.76953)
     | > loader_time: 0.43440  (0.49150)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07006 [0m(+0.00400)
     | > avg_loss:[91m 0.52768 [0m(+0.03216)
     | > avg_log_mle:[91m -0.27079 [0m(+0.00959)
     | > avg_loss_dur:[91m 0.79847 [0m(+0.02258)


[4m[1m > EPOCH: 957/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:47:06) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00601)
     | > avg_loss:[92m 0.49341 [0m(-0.03427)
     | > avg_log_mle:[92m -0.27727 [0m(-0.00648)
     | > avg_loss_dur:[92m 0.77068 [0m(-0.02779)


[4m[1m > EPOCH: 958/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:47:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 17250[0m
     | > loss: -0.59573  (-0.71621)
     | > log_mle: -0.69491  (-0.78975)
     | > loss_dur: 0.09919  (0.07354)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 9.91467  (16.81496)
     | > current_lr: 0.00024 
     | > step_time: 0.64460  (0.67411)
     | > loader_time: 0.42440  (0.41438)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00701)
     | > avg_loss:[91m 0.49578 [0m(+0.00237)
     | > avg_log_mle:[91m -0.27601 [0m(+0.00126)
     | > avg_loss_dur:[91m 0.77178 [0m(+0.00111)


[4m[1m > EPOCH: 959/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:48:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 17275[0m
     | > loss: -0.58646  (-0.68215)
     | > log_mle: -0.67872  (-0.76066)
     | > loss_dur: 0.09226  (0.07852)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 14.85128  (14.83883)
     | > current_lr: 0.00024 
     | > step_time: 0.78370  (0.72135)
     | > loader_time: 0.48140  (0.45310)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.00300)
     | > avg_loss:[91m 0.52805 [0m(+0.03228)
     | > avg_log_mle:[91m -0.27403 [0m(+0.00197)
     | > avg_loss_dur:[91m 0.80209 [0m(+0.03030)


[4m[1m > EPOCH: 960/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:48:38) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00100)
     | > avg_loss:[92m 0.44663 [0m(-0.08142)
     | > avg_log_mle:[92m -0.28208 [0m(-0.00804)
     | > avg_loss_dur:[92m 0.72871 [0m(-0.07338)


[4m[1m > EPOCH: 961/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:49:09) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 17300[0m
     | > loss: -0.79414  (-0.79423)
     | > log_mle: -0.85414  (-0.85274)
     | > loss_dur: 0.06000  (0.05851)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 20.46134  (13.48166)
     | > current_lr: 0.00024 
     | > step_time: 0.56250  (0.60755)
     | > loader_time: 0.36030  (0.35983)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00701)
     | > avg_loss:[91m 0.56626 [0m(+0.11963)
     | > avg_log_mle:[91m -0.27846 [0m(+0.00361)
     | > avg_loss_dur:[91m 0.84473 [0m(+0.11602)


[4m[1m > EPOCH: 962/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:49:41) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 17325[0m
     | > loss: -0.69130  (-0.70885)
     | > log_mle: -0.76984  (-0.78399)
     | > loss_dur: 0.07854  (0.07514)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 10.42475  (13.22633)
     | > current_lr: 0.00024 
     | > step_time: 0.87080  (0.69152)
     | > loader_time: 0.54650  (0.43184)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00400)
     | > avg_loss:[92m 0.49087 [0m(-0.07539)
     | > avg_log_mle:[92m -0.28712 [0m(-0.00866)
     | > avg_loss_dur:[92m 0.77799 [0m(-0.06673)


[4m[1m > EPOCH: 963/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:50:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 17350[0m
     | > loss: -0.60009  (-0.65703)
     | > log_mle: -0.68103  (-0.73619)
     | > loss_dur: 0.08093  (0.07915)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 7.00764  (19.42701)
     | > current_lr: 0.00024 
     | > step_time: 0.95690  (0.76584)
     | > loader_time: 0.58750  (0.48952)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00300)
     | > avg_loss:[92m 0.48321 [0m(-0.00767)
     | > avg_log_mle:[91m -0.28690 [0m(+0.00022)
     | > avg_loss_dur:[92m 0.77011 [0m(-0.00788)


[4m[1m > EPOCH: 964/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:50:43) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00400)
     | > avg_loss:[91m 0.48623 [0m(+0.00303)
     | > avg_log_mle:[91m -0.27621 [0m(+0.01069)
     | > avg_loss_dur:[92m 0.76244 [0m(-0.00767)


[4m[1m > EPOCH: 965/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:51:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 17375[0m
     | > loss: -0.66745  (-0.73375)
     | > log_mle: -0.75056  (-0.80381)
     | > loss_dur: 0.08311  (0.07006)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 5.52402  (10.37945)
     | > current_lr: 0.00024 
     | > step_time: 0.74070  (0.67842)
     | > loader_time: 0.47340  (0.42038)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00701)
     | > avg_loss:[91m 0.55716 [0m(+0.07093)
     | > avg_log_mle:[91m -0.27088 [0m(+0.00533)
     | > avg_loss_dur:[91m 0.82804 [0m(+0.06560)


[4m[1m > EPOCH: 966/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:51:45) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 17400[0m
     | > loss: -0.62374  (-0.68216)
     | > log_mle: -0.70766  (-0.76309)
     | > loss_dur: 0.08392  (0.08093)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 27.44072  (16.06729)
     | > current_lr: 0.00024 
     | > step_time: 0.91780  (0.71832)
     | > loader_time: 0.64060  (0.46209)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00100)
     | > avg_loss:[92m 0.46824 [0m(-0.08892)
     | > avg_log_mle:[92m -0.27858 [0m(-0.00770)
     | > avg_loss_dur:[92m 0.74682 [0m(-0.08122)


[4m[1m > EPOCH: 967/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:52:16) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00801)
     | > avg_loss:[91m 0.54920 [0m(+0.08096)
     | > avg_log_mle:[91m -0.27527 [0m(+0.00331)
     | > avg_loss_dur:[91m 0.82447 [0m(+0.07765)


[4m[1m > EPOCH: 968/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:52:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 17425[0m
     | > loss: -0.81656  (-0.81656)
     | > log_mle: -0.87174  (-0.87174)
     | > loss_dur: 0.05518  (0.05518)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 11.03277  (11.03277)
     | > current_lr: 0.00024 
     | > step_time: 0.65360  (0.65360)
     | > loader_time: 0.38430  (0.38435)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00701)
     | > avg_loss:[91m 0.55280 [0m(+0.00359)
     | > avg_log_mle:[91m -0.25145 [0m(+0.02383)
     | > avg_loss_dur:[92m 0.80424 [0m(-0.02023)


[4m[1m > EPOCH: 969/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:53:19) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 17450[0m
     | > loss: -0.66894  (-0.71210)
     | > log_mle: -0.75127  (-0.78449)
     | > loss_dur: 0.08233  (0.07240)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.47171  (19.01457)
     | > current_lr: 0.00024 
     | > step_time: 0.67860  (0.66736)
     | > loader_time: 0.42140  (0.40562)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06306 [0m(+0.00100)
     | > avg_loss:[92m 0.48896 [0m(-0.06384)
     | > avg_log_mle:[92m -0.26822 [0m(-0.01678)
     | > avg_loss_dur:[92m 0.75719 [0m(-0.04706)


[4m[1m > EPOCH: 970/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:53:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 17475[0m
     | > loss: -0.57276  (-0.68025)
     | > log_mle: -0.66423  (-0.75597)
     | > loss_dur: 0.09147  (0.07572)
     | > amp_scaler: 16384.00000  (16384.00000)
     | > grad_norm: 19.09972  (18.43623)
     | > current_lr: 0.00024 
     | > step_time: 0.87680  (0.75175)
     | > loader_time: 0.52850  (0.47350)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06306 [0m(+0.00000)
     | > avg_loss:[91m 0.49859 [0m(+0.00963)
     | > avg_log_mle:[91m -0.26469 [0m(+0.00353)
     | > avg_loss_dur:[91m 0.76328 [0m(+0.00609)


[4m[1m > EPOCH: 971/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:54:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07207 [0m(+0.00901)
     | > avg_loss:[91m 0.50629 [0m(+0.00770)
     | > avg_log_mle:[91m -0.25024 [0m(+0.01445)
     | > avg_loss_dur:[92m 0.75652 [0m(-0.00675)


[4m[1m > EPOCH: 972/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:54:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 17500[0m
     | > loss: -0.69434  (-0.75157)
     | > log_mle: -0.76912  (-0.81727)
     | > loss_dur: 0.07478  (0.06570)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 27.83111  (30.76116)
     | > current_lr: 0.00024 
     | > step_time: 0.73670  (0.66335)
     | > loader_time: 0.47440  (0.41938)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00100)
     | > avg_loss:[91m 0.50892 [0m(+0.00263)
     | > avg_log_mle:[92m -0.27609 [0m(-0.02586)
     | > avg_loss_dur:[91m 0.78501 [0m(+0.02849)


[4m[1m > EPOCH: 973/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:55:23) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 17525[0m
     | > loss: -0.65035  (-0.70172)
     | > log_mle: -0.73049  (-0.77544)
     | > loss_dur: 0.08015  (0.07372)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 14.68224  (14.96100)
     | > current_lr: 0.00024 
     | > step_time: 0.73470  (0.69727)
     | > loader_time: 0.47440  (0.45214)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00100)
     | > avg_loss:[92m 0.47672 [0m(-0.03219)
     | > avg_log_mle:[91m -0.25948 [0m(+0.01662)
     | > avg_loss_dur:[92m 0.73620 [0m(-0.04881)


[4m[1m > EPOCH: 974/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:55:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time: 0.07407 [0m(+0.00000)
     | > avg_loss:[91m 0.50088 [0m(+0.02416)
     | > avg_log_mle:[92m -0.26104 [0m(-0.00157)
     | > avg_loss_dur:[91m 0.76193 [0m(+0.02573)


[4m[1m > EPOCH: 975/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:56:25) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 0/18 -- GLOBAL_STEP: 17550[0m
     | > loss: -0.79260  (-0.79260)
     | > log_mle: -0.85232  (-0.85232)
     | > loss_dur: 0.05973  (0.05973)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.63806  (18.63806)
     | > current_lr: 0.00024 
     | > step_time: 0.50150  (0.50146)
     | > loader_time: 0.29230  (0.29225)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00200)
     | > avg_loss:[92m 0.50033 [0m(-0.00056)
     | > avg_log_mle:[91m -0.25149 [0m(+0.00955)
     | > avg_loss_dur:[92m 0.75182 [0m(-0.01011)


[4m[1m > EPOCH: 976/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:56:56) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 7/18 -- GLOBAL_STEP: 17575[0m
     | > loss: -0.67505  (-0.71848)
     | > log_mle: -0.75589  (-0.79039)
     | > loss_dur: 0.08084  (0.07191)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 12.55125  (17.06153)
     | > current_lr: 0.00024 
     | > step_time: 0.64960  (0.66832)
     | > loader_time: 0.42140  (0.41623)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07106 [0m(-0.00100)
     | > avg_loss:[91m 0.52705 [0m(+0.02672)
     | > avg_log_mle:[92m -0.26779 [0m(-0.01630)
     | > avg_loss_dur:[91m 0.79485 [0m(+0.04302)


[4m[1m > EPOCH: 977/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:57:27) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 14/18 -- GLOBAL_STEP: 17600[0m
     | > loss: -0.57298  (-0.66883)
     | > log_mle: -0.66524  (-0.74787)
     | > loss_dur: 0.09227  (0.07904)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.34129  (14.74397)
     | > current_lr: 0.00024 
     | > step_time: 1.01490  (0.74210)
     | > loader_time: 0.62060  (0.47021)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00500)
     | > avg_loss:[92m 0.42885 [0m(-0.09820)
     | > avg_log_mle:[92m -0.27892 [0m(-0.01112)
     | > avg_loss_dur:[92m 0.70776 [0m(-0.08708)


[4m[1m > EPOCH: 978/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:57:58) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00701)
     | > avg_loss:[91m 0.48456 [0m(+0.05571)
     | > avg_log_mle:[91m -0.26278 [0m(+0.01614)
     | > avg_loss_dur:[91m 0.74734 [0m(+0.03958)


[4m[1m > EPOCH: 979/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:58:30) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 3/18 -- GLOBAL_STEP: 17625[0m
     | > loss: -0.73164  (-0.76363)
     | > log_mle: -0.80594  (-0.83025)
     | > loss_dur: 0.07430  (0.06662)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 20.56582  (19.25051)
     | > current_lr: 0.00024 
     | > step_time: 0.68660  (0.63591)
     | > loader_time: 0.42440  (0.37834)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07807 [0m(+0.00901)
     | > avg_loss:[92m 0.47588 [0m(-0.00867)
     | > avg_log_mle:[92m -0.26746 [0m(-0.00468)
     | > avg_loss_dur:[92m 0.74335 [0m(-0.00399)


[4m[1m > EPOCH: 980/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:59:00) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 10/18 -- GLOBAL_STEP: 17650[0m
     | > loss: -0.67839  (-0.71515)
     | > log_mle: -0.75181  (-0.78713)
     | > loss_dur: 0.07342  (0.07198)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.71863  (14.93924)
     | > current_lr: 0.00024 
     | > step_time: 0.70160  (0.69303)
     | > loader_time: 0.42540  (0.44781)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07207 [0m(-0.00601)
     | > avg_loss:[91m 0.50717 [0m(+0.03128)
     | > avg_log_mle:[91m -0.26077 [0m(+0.00669)
     | > avg_loss_dur:[91m 0.76794 [0m(+0.02459)


[4m[1m > EPOCH: 981/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 14:59:32) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 17/18 -- GLOBAL_STEP: 17675[0m
     | > loss: -0.55950  (-0.66067)
     | > log_mle: -0.63789  (-0.73812)
     | > loss_dur: 0.07839  (0.07745)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 35.51043  (13.46899)
     | > current_lr: 0.00025 
     | > step_time: 0.85180  (0.76926)
     | > loader_time: 0.45540  (0.49192)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07206 [0m(-0.00000)
     | > avg_loss:[91m 0.58617 [0m(+0.07901)
     | > avg_log_mle:[91m -0.24697 [0m(+0.01381)
     | > avg_loss_dur:[91m 0.83314 [0m(+0.06520)


[4m[1m > EPOCH: 982/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:00:03) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00701)
     | > avg_loss:[92m 0.47047 [0m(-0.11570)
     | > avg_log_mle:[92m -0.28640 [0m(-0.03943)
     | > avg_loss_dur:[92m 0.75687 [0m(-0.07627)


[4m[1m > EPOCH: 983/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:00:35) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 6/18 -- GLOBAL_STEP: 17700[0m
     | > loss: -0.59961  (-0.70356)
     | > log_mle: -0.69766  (-0.78049)
     | > loss_dur: 0.09805  (0.07693)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.39470  (16.57480)
     | > current_lr: 0.00025 
     | > step_time: 0.64460  (0.67111)
     | > loader_time: 0.39240  (0.41688)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06706 [0m(+0.00200)
     | > avg_loss:[91m 0.53428 [0m(+0.06381)
     | > avg_log_mle:[91m -0.27516 [0m(+0.01125)
     | > avg_loss_dur:[91m 0.80943 [0m(+0.05256)


[4m[1m > EPOCH: 984/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:01:05) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 13/18 -- GLOBAL_STEP: 17725[0m
     | > loss: -0.58789  (-0.69097)
     | > log_mle: -0.67902  (-0.76608)
     | > loss_dur: 0.09113  (0.07511)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 11.02408  (12.12756)
     | > current_lr: 0.00025 
     | > step_time: 0.78370  (0.71789)
     | > loader_time: 0.51750  (0.45734)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00601)
     | > avg_loss:[92m 0.49695 [0m(-0.03733)
     | > avg_log_mle:[91m -0.25791 [0m(+0.01724)
     | > avg_loss_dur:[92m 0.75486 [0m(-0.05457)


[4m[1m > EPOCH: 985/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:01:37) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07006 [0m(-0.00300)
     | > avg_loss:[92m 0.47263 [0m(-0.02432)
     | > avg_log_mle:[92m -0.26692 [0m(-0.00901)
     | > avg_loss_dur:[92m 0.73955 [0m(-0.01531)


[4m[1m > EPOCH: 986/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:02:08) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 2/18 -- GLOBAL_STEP: 17750[0m
     | > loss: -0.79316  (-0.79557)
     | > log_mle: -0.85448  (-0.85493)
     | > loss_dur: 0.06132  (0.05935)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 22.26439  (25.52349)
     | > current_lr: 0.00025 
     | > step_time: 0.56550  (0.61006)
     | > loader_time: 0.35130  (0.35883)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06206 [0m(-0.00801)
     | > avg_loss:[91m 0.57799 [0m(+0.10536)
     | > avg_log_mle:[91m -0.26337 [0m(+0.00354)
     | > avg_loss_dur:[91m 0.84137 [0m(+0.10182)


[4m[1m > EPOCH: 987/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:02:40) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 9/18 -- GLOBAL_STEP: 17775[0m
     | > loss: -0.71211  (-0.70167)
     | > log_mle: -0.78849  (-0.77835)
     | > loss_dur: 0.07638  (0.07668)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 4.41244  (16.19505)
     | > current_lr: 0.00025 
     | > step_time: 0.86680  (0.69330)
     | > loader_time: 0.59350  (0.43907)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.01101)
     | > avg_loss:[92m 0.49078 [0m(-0.08722)
     | > avg_log_mle:[91m -0.25431 [0m(+0.00906)
     | > avg_loss_dur:[92m 0.74509 [0m(-0.09628)


[4m[1m > EPOCH: 988/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:03:11) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 16/18 -- GLOBAL_STEP: 17800[0m
     | > loss: -0.58386  (-0.67251)
     | > log_mle: -0.67313  (-0.75376)
     | > loss_dur: 0.08927  (0.08125)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 8.05139  (16.21692)
     | > current_lr: 0.00025 
     | > step_time: 0.95290  (0.76270)
     | > loader_time: 0.60560  (0.48594)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06706 [0m(-0.00601)
     | > avg_loss:[92m 0.46440 [0m(-0.02638)
     | > avg_log_mle:[91m -0.24974 [0m(+0.00457)
     | > avg_loss_dur:[92m 0.71414 [0m(-0.03095)


[4m[1m > EPOCH: 989/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:03:42) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.06906 [0m(+0.00200)
     | > avg_loss:[91m 0.51760 [0m(+0.05320)
     | > avg_log_mle:[91m -0.24365 [0m(+0.00610)
     | > avg_loss_dur:[91m 0.76125 [0m(+0.04711)


[4m[1m > EPOCH: 990/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:04:14) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 5/18 -- GLOBAL_STEP: 17825[0m
     | > loss: -0.67197  (-0.73193)
     | > log_mle: -0.75694  (-0.80610)
     | > loss_dur: 0.08497  (0.07417)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 18.23219  (16.88915)
     | > current_lr: 0.00025 
     | > step_time: 0.74470  (0.67421)
     | > loader_time: 0.46340  (0.43259)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06506 [0m(-0.00400)
     | > avg_loss:[92m 0.47641 [0m(-0.04119)
     | > avg_log_mle:[92m -0.24981 [0m(-0.00617)
     | > avg_loss_dur:[92m 0.72623 [0m(-0.03502)


[4m[1m > EPOCH: 991/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:04:44) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 12/18 -- GLOBAL_STEP: 17850[0m
     | > loss: -0.60162  (-0.69232)
     | > log_mle: -0.69206  (-0.76964)
     | > loss_dur: 0.09044  (0.07732)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 29.78607  (17.71965)
     | > current_lr: 0.00025 
     | > step_time: 0.91480  (0.71407)
     | > loader_time: 0.65860  (0.47418)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07307 [0m(+0.00801)
     | > avg_loss:[91m 0.50605 [0m(+0.02963)
     | > avg_log_mle:[92m -0.25974 [0m(-0.00993)
     | > avg_loss_dur:[91m 0.76579 [0m(+0.03956)


[4m[1m > EPOCH: 992/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:05:15) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.07307 [0m(-0.00000)
     | > avg_loss:[91m 0.53829 [0m(+0.03224)
     | > avg_log_mle:[92m -0.26437 [0m(-0.00463)
     | > avg_loss_dur:[91m 0.80266 [0m(+0.03687)


[4m[1m > EPOCH: 993/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:05:47) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 1/18 -- GLOBAL_STEP: 17875[0m
     | > loss: -0.80044  (-0.80044)
     | > log_mle: -0.86059  (-0.86059)
     | > loss_dur: 0.06015  (0.06015)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 9.77488  (9.77488)
     | > current_lr: 0.00025 
     | > step_time: 0.65660  (0.65660)
     | > loader_time: 0.40540  (0.40537)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07407 [0m(+0.00100)
     | > avg_loss:[92m 0.51506 [0m(-0.02323)
     | > avg_log_mle:[91m -0.26245 [0m(+0.00193)
     | > avg_loss_dur:[92m 0.77751 [0m(-0.02516)


[4m[1m > EPOCH: 994/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:06:18) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 8/18 -- GLOBAL_STEP: 17900[0m
     | > loss: -0.67674  (-0.72486)
     | > log_mle: -0.75434  (-0.79619)
     | > loss_dur: 0.07760  (0.07133)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.46316  (16.80987)
     | > current_lr: 0.00025 
     | > step_time: 0.67860  (0.66961)
     | > loader_time: 0.41140  (0.41225)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06906 [0m(-0.00500)
     | > avg_loss:[92m 0.43964 [0m(-0.07542)
     | > avg_log_mle:[91m -0.26082 [0m(+0.00163)
     | > avg_loss_dur:[92m 0.70046 [0m(-0.07705)


[4m[1m > EPOCH: 995/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:06:50) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 15/18 -- GLOBAL_STEP: 17925[0m
     | > loss: -0.59943  (-0.68072)
     | > log_mle: -0.68644  (-0.75803)
     | > loss_dur: 0.08701  (0.07731)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 17.48553  (18.26606)
     | > current_lr: 0.00025 
     | > step_time: 0.87780  (0.75135)
     | > loader_time: 0.57650  (0.46409)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06806 [0m(-0.00100)
     | > avg_loss:[91m 0.54386 [0m(+0.10422)
     | > avg_log_mle:[91m -0.25159 [0m(+0.00923)
     | > avg_loss_dur:[91m 0.79545 [0m(+0.09499)


[4m[1m > EPOCH: 996/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:07:21) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.00801)
     | > avg_loss:[92m 0.51809 [0m(-0.02577)
     | > avg_log_mle:[92m -0.25631 [0m(-0.00472)
     | > avg_loss_dur:[92m 0.77440 [0m(-0.02105)


[4m[1m > EPOCH: 997/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:07:52) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 4/18 -- GLOBAL_STEP: 17950[0m
     | > loss: -0.74415  (-0.78143)
     | > log_mle: -0.80982  (-0.84213)
     | > loss_dur: 0.06566  (0.06070)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 6.82899  (10.90278)
     | > current_lr: 0.00025 
     | > step_time: 0.73270  (0.66010)
     | > loader_time: 0.49750  (0.39786)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07707 [0m(+0.00100)
     | > avg_loss:[91m 0.56006 [0m(+0.04197)
     | > avg_log_mle:[91m -0.24821 [0m(+0.00810)
     | > avg_loss_dur:[91m 0.80827 [0m(+0.03387)


[4m[1m > EPOCH: 998/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:08:22) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m   --> STEP: 11/18 -- GLOBAL_STEP: 17975[0m
     | > loss: -0.65338  (-0.71233)
     | > log_mle: -0.73612  (-0.78550)
     | > loss_dur: 0.08274  (0.07317)
     | > amp_scaler: 8192.00000  (8192.00000)
     | > grad_norm: 16.44300  (17.35177)
     | > current_lr: 0.00025 
     | > step_time: 0.73870  (0.69891)
     | > loader_time: 0.43240  (0.43476)


[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[92m 0.06606 [0m(-0.01101)
     | > avg_loss:[92m 0.54186 [0m(-0.01820)
     | > avg_log_mle:[92m -0.25984 [0m(-0.01163)
     | > avg_loss_dur:[92m 0.80170 [0m(-0.00657)


[4m[1m > EPOCH: 999/1000[0m
 --> ./output\run-September-15-2022_04+45AM-910d77a

[1m > TRAINING (2022-09-15 15:08:54) [0m




> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 1129
 | > Preprocessing samples
 | > Max text length: 81
 | > Min text length: 8
 | > Avg text length: 49.47475642161205
 | 
 | > Max audio length: 140760.0
 | > Min audio length: 24055.0
 | > Avg audio length: 66621.55358724535
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.



[1m > EVALUATION [0m





> DataLoader initialization
| > Tokenizer:
	| > add_blank: False
	| > use_eos_bos: False
	| > use_phonemes: True
	| > phonemizer:
		| > phoneme language: en-us
		| > phoneme backend: gruut
| > Number of instances : 11
 | > Preprocessing samples
 | > Max text length: 54
 | > Min text length: 21
 | > Avg text length: 44.54545454545455
 | 
 | > Max audio length: 82620.0
 | > Min audio length: 21798.0
 | > Avg audio length: 57012.0
 | > Num. instances discarded samples: 0
 | > Batch group size: 0.
 | > Synthesizing test sentences.



  [1m--> EVAL PERFORMANCE[0m
     | > avg_loader_time:[91m 0.07607 [0m(+0.01001)
     | > avg_loss:[91m 0.55008 [0m(+0.00822)
     | > avg_log_mle:[91m -0.25137 [0m(+0.00847)
     | > avg_loss_dur:[92m 0.80145 [0m(-0.00025)



In [13]:
# Load TensorBoard's IPython extension; the %tensorboard line magic used in the
# following cell is only available once this extension has been loaded.
%load_ext tensorboard

In [14]:
%tensorboard --logdir="./output\run-September-15-2022_04+45AM-910d77a"

In [None]:
# Shell escape that sends the default kill signal to process ID 12.
# NOTE(review): presumably intended to stop the TensorBoard server started by
# the %tensorboard cell — the PID is hard-coded, so confirm the real process ID
# before running. This cell has no execution count (In [None]), i.e. it was not
# run in the saved notebook. `kill` is a POSIX command, while the run directory
# in this notebook uses a Windows-style separator — verify it exists in this shell.
!kill 12