In [1]:
import os

import torch
from torch.nn import MSELoss
from torch.optim import Adam
from torch.utils.tensorboard import SummaryWriter

from data_loader import load_cifar10_data
from loggers import VAE_LOGGER
from metrics import FIDMetric
from models import VAE, LARGER_VAE
from train import train, validate, save_checkpoint
from vae_loss import VAE_Loss

In [2]:
# Build the three CIFAR-10 data loaders (train / validation / test).
train_loader, val_loader, test_loader = load_cifar10_data()

# Report the total number of samples behind each loader.
split_sizes = {
    "Total number of training samples:": len(train_loader.dataset),
    "Total number of validation samples:": len(val_loader.dataset),
    "Total number of test samples:": len(test_loader.dataset),
}
for label, sample_count in split_sizes.items():
    print(label, sample_count)

Files already downloaded and verified
Files already downloaded and verified
Total number of training samples: 45000
Total number of validation samples: 5000
Total number of test samples: 10000


In [None]:
# Hyperparameters
epochs = 1000
learning_rate = 1e-5  # alternative value: 0.0001
log_interval = 100  # forwarded to train(); presumably the logging period in batches -- confirm in train.py
seed = 42

# Fix torch's global RNG seed so repeated runs start from the same random state.
torch.manual_seed(seed)

# Device configuration
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Model, loss function, and optimizer
model = VAE(latent_dim=1024).to(device)  # Example model; replace with any model
criterion = VAE_Loss()
optimizer = Adam(model.parameters(), lr=learning_rate)
metric = FIDMetric(device)

# TensorBoard writer, kept in its own variable so it can be closed once training ends.
writer = SummaryWriter()
logger = VAE_LOGGER(writer)

best_checkpoint_path = "VAE_MODEL_1e-5_lr1e-5/best_ckpt.pth"
# Make sure the checkpoint directory exists before the first save is attempted.
os.makedirs(os.path.dirname(best_checkpoint_path), exist_ok=True)

# Training loop: one training pass and one validation pass per epoch; the model
# is checkpointed whenever the validation loss reaches a new minimum.
best_val_loss = float('inf')
try:
    for epoch in range(1, epochs + 1):
        train(model, train_loader, criterion, optimizer, device, epoch, logger, log_interval)
        # fid_score is returned by validate() but is not used for model selection here.
        val_loss, fid_score = validate(model, val_loader, criterion, device, epoch, logger, metric)

        # Save checkpoint if validation loss improves
        if val_loss < best_val_loss:
            print(f"Validation loss improved from {best_val_loss:.4f} to {val_loss:.4f}. Saving model...")
            best_val_loss = val_loss
            save_checkpoint(model, best_checkpoint_path)
finally:
    # Flush and close the event file even if training is interrupted or raises,
    # so the TensorBoard events logged so far are written to disk.
    writer.flush()
    writer.close()

Epoch 1 [Train]:   0%|          | 1/704 [00:00<04:42,  2.49it/s]

KL tensor(11003.2559, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0968, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8773.8359, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1003, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8546.4414, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0876, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7563.0674, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0910, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6498.6543, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0870, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4986.4385, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0942, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3944.5972, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1004, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3161.7686, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0940, device='cuda:0', grad_fn=<Ms

Epoch 1 [Train]:   6%|▌         | 39/704 [00:00<00:07, 88.15it/s]

KL tensor(1807.9045, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0937, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1905.9891, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0990, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1700.6433, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1612.5417, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0913, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1650.6946, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0859, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1542.0670, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0998, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1546.0549, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0944, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1619.7252, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0910, device='cuda:0', grad_fn=<Mse

Epoch 1 [Train]:  10%|█         | 72/704 [00:00<00:05, 123.13it/s]

KL tensor(1125.6088, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0888, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(993.9291, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0903, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(945.3600, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0906, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1034.4031, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0895, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(938.7576, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0939, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(942.1714, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0941, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(934.4486, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0920, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(847.7288, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0877, device='cuda:0', grad_fn=<MseLossBa

Epoch 1 [Train]:  15%|█▌        | 107/704 [00:01<00:04, 147.49it/s]

tensor(408.8073, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0981, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(382.7362, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0917, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(338.8533, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0953, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(362.5591, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0960, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(284.7304, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0938, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(319.0980, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0955, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(545.7239, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0924, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(871.5190, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0912, device='cuda:0', grad_fn=<MseLossBackwar

Epoch 1 [Train]:  20%|██        | 141/704 [00:01<00:03, 143.99it/s]

KL tensor(190.4063, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(189.0655, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0957, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(224.9229, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0911, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(193.9609, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1051, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(201.7198, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0916, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(257.7424, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0944, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(222.3275, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0958, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(226.6984, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0935, device='cuda:0', grad_fn=<MseLossBack

Epoch 1 [Train]:  25%|██▌       | 179/704 [00:01<00:03, 164.09it/s]

KL tensor(149.4512, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0947, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(178.4148, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1024, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(290.4307, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0923, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(182.7829, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0934, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(172.9188, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0922, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(136.4694, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0953, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(167.6248, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(234.1472, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0891, device='cuda:0', grad_fn=<MseLossBack

Epoch 1 [Train]:  31%|███       | 216/704 [00:01<00:02, 164.82it/s]

KL tensor(180.0414, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1006, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(192.2338, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(114.7783, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0930, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(160.5969, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0970, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(172.8662, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0916, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(205.2543, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0925, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(160.0978, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0928, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(184.8805, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0967, device='cuda:0', grad_fn=<MseLossBack

Epoch 1 [Train]:  36%|███▌      | 250/704 [00:01<00:02, 165.73it/s]

tensor(0.1000, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(126.7826, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0959, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(111.7286, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0971, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(122.7819, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0949, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(271.6006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0893, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(164.9537, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1001, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(158.9813, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0913, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(209.7440, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(151.8674, device='cuda:0', grad_fn=<MeanBackward

Epoch 1 [Train]:  40%|████      | 285/704 [00:02<00:02, 167.04it/s]

KL tensor(132.5679, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0889, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(96.4703, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0934, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(111.5286, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1005, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(102.5076, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0924, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(112.2555, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0933, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(134.5525, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(110.1819, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0952, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(107.5519, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0971, device='cuda:0', grad_fn=<MseLossBackw

Epoch 1 [Train]:  43%|████▎     | 302/704 [00:02<00:02, 167.65it/s]

KL tensor(104.2937, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0916, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(143.0314, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0943, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(105.2752, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1006, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(154.3553, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0902, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(100.1653, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0949, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(93.5178, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0895, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(94.3974, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0902, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(123.7060, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0912, device='cuda:0', grad_fn=<MseLossBackwa

Epoch 1 [Train]:  51%|█████     | 357/704 [00:02<00:01, 175.39it/s]

KL tensor(77.3005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0884, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(97.7881, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0945, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(94.0067, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(99.5742, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0965, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(115.0411, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0887, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(103.4803, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0925, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(90.0927, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0943, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(79.9301, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0937, device='cuda:0', grad_fn=<MseLossBackward0>

Epoch 1 [Train]:  53%|█████▎    | 376/704 [00:02<00:01, 177.33it/s]

KL tensor(73.3796, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0947, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(77.1472, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.1000, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(75.4251, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0886, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(74.6183, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0944, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(80.8638, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0976, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(76.5557, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0948, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(77.3074, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0954, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(85.9252, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0875, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  59%|█████▊    | 413/704 [00:02<00:01, 178.43it/s]

KL tensor(74.4471, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0891, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(68.5728, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0891, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(64.3134, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0935, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(68.6516, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0912, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(67.8614, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(74.4405, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0954, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(67.4960, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(64.6422, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0923, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  64%|██████▍   | 450/704 [00:03<00:01, 171.87it/s]

KL tensor(66.0905, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0971, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(60.4367, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0929, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(62.1012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0929, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(69.0199, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0845, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(78.2296, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0875, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(73.5634, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0972, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(62.1327, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0907, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(52.4524, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0904, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  69%|██████▉   | 487/704 [00:03<00:01, 176.17it/s]

KL tensor(58.7075, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0864, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(66.7986, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0928, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(52.9552, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0898, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(52.1748, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0947, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(58.6595, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0920, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(64.9110, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0994, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(65.4508, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(51.1954, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0901, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  74%|███████▍  | 524/704 [00:03<00:01, 176.43it/s]

KL tensor(60.9309, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0885, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(48.9024, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0884, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(51.0386, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0918, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(57.9285, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0816, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(62.2077, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0845, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(74.1168, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0872, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(63.8292, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0844, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(54.0560, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0945, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  80%|███████▉  | 562/704 [00:03<00:00, 173.43it/s]

KL tensor(47.9899, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0915, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(47.9785, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(48.7927, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0946, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(46.5175, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0922, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(42.0851, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(46.1006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(42.1917, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0921, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(40.8188, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0920, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  85%|████████▌ | 599/704 [00:03<00:00, 174.67it/s]

KL tensor(39.2185, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0946, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(44.4441, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0919, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(43.5408, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0920, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(38.5427, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0916, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(39.7483, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0930, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(43.8392, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0902, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(46.8972, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0968, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(44.3973, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  90%|█████████ | 635/704 [00:04<00:00, 167.57it/s]

KL tensor(40.2334, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0836, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(39.7232, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0976, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(38.6640, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0952, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(37.9365, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(39.7382, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0926, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(35.7782, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0865, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(38.4602, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0880, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(42.0533, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0917, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]:  95%|█████████▌| 669/704 [00:04<00:00, 165.61it/s]

KL tensor(40.7641, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0986, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(31.2117, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0821, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(30.6613, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0929, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(37.8088, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(41.4959, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0933, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(39.0312, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0906, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(35.1336, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0932, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(37.7396, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Train]: 100%|██████████| 704/704 [00:04<00:00, 155.75it/s]


KL tensor(30.4359, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0900, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(31.4532, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(35.1287, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0860, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(33.7848, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(30.2693, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0933, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(29.5516, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0923, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(35.5466, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0977, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(29.9934, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0938, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 1 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 86.51it/s]


additional_logs are not defined for this logger
KL tensor(83.2067, device='cuda:0')
REC tensor(0.0673, device='cuda:0')
KL tensor(117.8902, device='cuda:0')
REC tensor(0.0714, device='cuda:0')
KL tensor(16.8952, device='cuda:0')
REC tensor(0.0651, device='cuda:0')
KL tensor(6.9741, device='cuda:0')
REC tensor(0.0593, device='cuda:0')
KL tensor(9.8416, device='cuda:0')
REC tensor(0.0674, device='cuda:0')
KL tensor(71.7872, device='cuda:0')
REC tensor(0.0654, device='cuda:0')
KL tensor(22.4075, device='cuda:0')
REC tensor(0.0735, device='cuda:0')
KL tensor(76.4439, device='cuda:0')
REC tensor(0.0737, device='cuda:0')
Validation loss improved from inf to 5.1322. Saving model...


Epoch 2 [Train]:   2%|▏         | 11/704 [00:00<00:06, 107.84it/s]

KL tensor(43.6302, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0943, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(45.0630, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0968, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(28.7100, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0904, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(26.2224, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0891, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(29.0208, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0900, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(38.4318, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0844, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(32.9802, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0940, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(26.3871, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0865, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:   4%|▍         | 29/704 [00:00<00:04, 149.73it/s]

KL tensor(27.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0913, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(25.7789, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0853, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(34.3419, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0930, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(34.7003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0901, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(29.1913, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0884, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(26.4931, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0880, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(27.2733, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0861, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(31.2815, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0956, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:   7%|▋         | 48/704 [00:00<00:03, 165.43it/s]

KL tensor(26.6911, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.2932, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0919, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.1365, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0921, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(23.8663, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0886, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(25.5460, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0868, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.6205, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(23.6583, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0859, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(26.5986, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0902, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  10%|▉         | 67/704 [00:00<00:03, 171.11it/s]

KL tensor(21.9282, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0855, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(27.1054, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0861, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(31.6000, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0887, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(27.2817, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0922, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.5618, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0949, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(23.8636, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0823, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(30.7153, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0974, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(30.5059, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  12%|█▏        | 85/704 [00:00<00:03, 167.97it/s]

KL tensor(22.5241, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0924, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.9906, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0858, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.0610, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0942, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.7626, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0871, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.6383, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.2751, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0929, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.7498, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0905, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.3764, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0925, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  14%|█▍        | 102/704 [00:00<00:03, 168.44it/s]

KL tensor(23.2449, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0955, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.5590, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0900, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.4583, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0858, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.9501, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0888, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.9827, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0927, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.1381, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0891, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.2328, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0902, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.3879, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0962, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  17%|█▋        | 120/704 [00:00<00:03, 170.60it/s]

KL tensor(20.9379, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0878, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(23.2857, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0885, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.7351, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.8888, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0927, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(19.9438, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0890, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(20.8592, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0867, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.4450, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0886, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(24.4383, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0857, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  20%|█▉        | 139/704 [00:00<00:03, 173.95it/s]

KL tensor(18.5574, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(16.9266, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0903, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.0197, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0850, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(19.6967, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(20.4571, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0908, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(19.8912, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0954, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.9120, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0886, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.9870, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0904, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  22%|██▏       | 157/704 [00:00<00:03, 174.44it/s]

KL tensor(19.7484, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0920, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(21.5046, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0952, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.9535, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.2372, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0894, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(19.4804, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0831, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(22.4130, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0901, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(20.0872, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0842, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.1826, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0913, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  25%|██▍       | 175/704 [00:01<00:03, 176.06it/s]

KL tensor(18.7540, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0826, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.4492, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0848, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.8420, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0913, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.5177, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0834, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(18.2130, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(19.1822, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0851, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.7206, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0842, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(14.8212, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0955, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  28%|██▊       | 194/704 [00:01<00:02, 177.85it/s]

KL tensor(16.3063, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0887, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.2516, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0858, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.4169, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0875, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(16.5731, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0868, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(19.9073, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0895, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.1837, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0957, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.4584, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0846, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.0604, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  30%|███       | 213/704 [00:01<00:02, 180.63it/s]

KL tensor(16.3014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0759, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.8322, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0923, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.4482, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0850, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(20.1524, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0841, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.7963, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0923, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(16.6710, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0826, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.5727, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0827, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(18.5111, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  33%|███▎      | 232/704 [00:01<00:02, 182.92it/s]

KL tensor(18.4277, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0824, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.9867, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0887, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.3649, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0933, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.2384, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0947, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.6847, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0869, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(18.2720, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0877, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.8517, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0867, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.4075, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0902, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  36%|███▌      | 251/704 [00:01<00:02, 183.04it/s]

KL tensor(17.7415, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0869, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.8283, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0847, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.0885, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0883, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(14.4891, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0856, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(15.0809, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(16.4228, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0892, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(14.7862, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.4727, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0863, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  38%|███▊      | 270/704 [00:01<00:02, 171.63it/s]

KL tensor(12.2458, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0805, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.9936, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0918, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.9602, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0869, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.8018, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0937, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.8469, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0823, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.5731, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0889, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.4003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0877, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.4880, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0914, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  41%|████      | 288/704 [00:01<00:02, 173.87it/s]

KL tensor(12.1855, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0865, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.2040, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0843, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.9670, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0888, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.4855, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0873, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.0365, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0912, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.4962, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0842, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.5479, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0858, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(17.0204, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  44%|████▎     | 307/704 [00:01<00:02, 175.98it/s]

KL tensor(12.9529, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0871, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(14.5319, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0805, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.3670, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0870, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.5821, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0837, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.1300, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0872, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.9694, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0876, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.3386, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0849, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.8460, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0910, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  46%|████▋     | 326/704 [00:01<00:02, 178.52it/s]

KL tensor(11.4353, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.5634, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0822, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(13.2387, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0933, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.1983, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.3639, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0863, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.4172, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0965, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.0643, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.3682, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0915, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Train]:  49%|████▉     | 346/704 [00:01<00:01, 182.19it/s]

KL tensor(8.1487, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0829, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.8235, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0807, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.8576, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0853, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.5167, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0848, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.4505, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.5539, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0856, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.0963, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0813, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.4595, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0880, device='cuda:0', grad_fn=<MseLossBackward0>)
KL t

Epoch 2 [Train]:  52%|█████▏    | 365/704 [00:02<00:01, 178.92it/s]

KL tensor(9.3441, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.0056, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0914, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(11.3638, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0833, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(12.2761, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0815, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.5361, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0919, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.5392, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0903, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.9357, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0807, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.7557, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0800, device='cuda:0', grad_fn=<MseLossBackward0>)
KL 

Epoch 2 [Train]:  54%|█████▍    | 383/704 [00:02<00:01, 170.86it/s]

KL tensor(10.4021, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0919, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.1910, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0801, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.3468, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0937, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.5119, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0876, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.9766, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0885, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.8577, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0842, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.6098, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0807, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.4304, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0839, device='cuda:0', grad_fn=<MseLossBackward0>)
KL te

Epoch 2 [Train]:  57%|█████▋    | 402/704 [00:02<00:01, 174.42it/s]

KL tensor(9.3689, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0853, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.2960, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0898, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.6358, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0849, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.7936, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0843, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.5583, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0887, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.2667, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0829, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(10.3486, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0813, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.2986, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0836, device='cuda:0', grad_fn=<MseLossBackward0>)
KL ten

Epoch 2 [Train]:  60%|█████▉    | 421/704 [00:02<00:01, 177.87it/s]

KL tensor(9.0100, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0831, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.6090, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0776, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.5840, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0841, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.1994, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0865, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.9556, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0867, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.6495, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0899, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.1034, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0875, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.9098, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0898, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  62%|██████▏   | 439/704 [00:02<00:01, 173.93it/s]

tensor(8.4981, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0821, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.4829, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.2915, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0789, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.6126, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0888, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.6527, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0874, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.0560, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0912, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(9.3675, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0923, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.9975, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0808, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6

Epoch 2 [Train]:  65%|██████▍   | 457/704 [00:02<00:01, 171.65it/s]

KL tensor(9.1743, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0837, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.5487, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0800, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.7104, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0822, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.5649, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0792, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.6421, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0870, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.5342, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0853, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.3327, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0915, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.6588, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0771, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  68%|██████▊   | 476/704 [00:02<00:01, 175.60it/s]

KL tensor(7.0351, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0840, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.7511, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0897, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.0721, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0835, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.2740, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0856, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.9257, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0827, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.8120, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0793, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.0320, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0916, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.8238, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0833, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  70%|███████   | 495/704 [00:02<00:01, 177.27it/s]

tensor(0.0799, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.9382, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0928, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.6203, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0869, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.7583, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0860, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.5696, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0832, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.3425, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0776, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.2707, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0819, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.9052, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0853, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.3067, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 2 [Train]:  73%|███████▎  | 514/704 [00:02<00:01, 177.99it/s]

tensor(0.0824, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.3476, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0884, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.3617, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0794, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.0713, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0846, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.2515, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0862, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.5354, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0814, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.3627, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0832, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.2735, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0855, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.6454, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 2 [Train]:  76%|███████▌  | 532/704 [00:03<00:01, 171.45it/s]

KL tensor(6.4244, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0786, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.9258, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0786, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.3926, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0851, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.6202, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0791, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.1239, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0845, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.1739, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0884, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.5435, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0869, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.0351, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0808, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  78%|███████▊  | 550/704 [00:03<00:00, 169.28it/s]

tensor(0.0808, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.4855, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0797, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.9343, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0872, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.0928, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0826, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.0444, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0778, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.8644, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0837, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.9978, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0828, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(7.1568, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0811, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.1344, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 2 [Train]:  81%|████████  | 569/704 [00:03<00:00, 172.96it/s]

tensor(4.2702, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0774, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.8014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0797, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.9531, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0807, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.4594, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0872, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.2029, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0876, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.6131, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0782, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.7377, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0817, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.9695, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0768, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5

Epoch 2 [Train]:  84%|████████▎ | 588/704 [00:03<00:00, 175.33it/s]

KL tensor(6.1451, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0749, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.2182, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0801, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.9133, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0858, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.5032, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0805, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.5541, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0858, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.6607, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0811, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.1728, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0838, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.7008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0781, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  86%|████████▌ | 606/704 [00:03<00:00, 175.99it/s]

KL tensor(4.7025, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0793, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.5452, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0800, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.8780, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0898, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(6.4677, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0865, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.1220, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0755, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.8926, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0885, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.9046, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0926, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.7129, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0840, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  91%|█████████▏| 644/704 [00:03<00:00, 181.43it/s]

KL tensor(4.4566, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0838, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.3473, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0810, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.2263, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0864, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.5382, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0882, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.3923, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0790, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.9039, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0763, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.4493, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0863, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.3859, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0786, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  94%|█████████▍| 663/704 [00:03<00:00, 183.38it/s]

KL tensor(3.9208, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0833, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.5891, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0884, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.5664, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0816, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.8674, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0881, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.6576, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0769, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.1357, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0823, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.4157, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0864, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.7341, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0846, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]:  97%|█████████▋| 682/704 [00:03<00:00, 183.84it/s]

KL tensor(4.2155, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0768, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.7631, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0738, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.9590, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0831, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.2563, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0801, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.9473, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0824, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.5134, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0795, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(5.1814, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0822, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.3830, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0805, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 2 [Train]: 100%|██████████| 704/704 [00:04<00:00, 174.36it/s]


KL tensor(3.5033, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0793, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.9319, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0775, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.4897, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0787, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.0364, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0782, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5649, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0850, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 2 [Validation]:   0%|          | 0/79 [00:00<?, ?it/s]

KL tensor(2.4017, device='cuda:0')
REC tensor(0.0646, device='cuda:0')
KL tensor(2.1647, device='cuda:0')
REC tensor(0.0682, device='cuda:0')
KL tensor(0.5726, device='cuda:0')
REC tensor(0.0631, device='cuda:0')
KL tensor(0.4687, device='cuda:0')
REC tensor(0.0574, device='cuda:0')
KL tensor(0.3603, device='cuda:0')
REC tensor(0.0640, device='cuda:0')
KL tensor(2.1076, device='cuda:0')
REC tensor(0.0619, device='cuda:0')
KL tensor(0.6200, device='cuda:0')
REC tensor(0.0711, device='cuda:0')
KL tensor(2.3441, device='cuda:0')
REC tensor(0.0712, device='cuda:0')


Epoch 2 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 88.12it/s]


Validation loss improved from 5.1322 to 0.1397. Saving model...


Epoch 3 [Train]:   1%|▏         | 10/704 [00:00<00:07, 96.95it/s]

KL tensor(3.1898, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0789, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.9633, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0875, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.8841, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0862, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.0643, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0831, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.9749, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0775, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.5412, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0786, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.4170, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0838, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.1189, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0790, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:   4%|▎         | 26/704 [00:00<00:05, 131.65it/s]

KL tensor(2.7925, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0780, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.6717, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0822, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.2980, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0889, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.3307, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0719, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.1454, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0886, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.3074, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0800, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.4264, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0751, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.1222, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0765, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:   6%|▌         | 43/704 [00:00<00:04, 145.53it/s]

tensor(4.2147, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0843, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.1891, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0760, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.4503, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0823, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.7796, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0831, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.3300, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0839, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.2952, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0778, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.2743, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.9364, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0864, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2

Epoch 3 [Train]:   9%|▊         | 61/704 [00:00<00:04, 158.09it/s]

KL tensor(2.7626, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0744, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.5933, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0750, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.8089, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0745, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.7481, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0786, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.9557, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0798, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.2956, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0793, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.7657, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0738, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.6749, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0745, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  11%|█         | 79/704 [00:00<00:03, 164.81it/s]

KL tensor(2.9305, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0736, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.3538, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0742, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.4019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0760, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.4758, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0817, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.1733, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0798, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.6778, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0787, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.3946, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0787, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.9613, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0768, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  14%|█▍        | 98/704 [00:00<00:03, 170.25it/s]

KL tensor(1.8833, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0789, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.6119, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0841, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.5365, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0811, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.2068, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0759, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.1813, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0832, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.4585, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0857, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.6402, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0787, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.3167, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0789, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  19%|█▉        | 134/704 [00:00<00:03, 164.71it/s]

KL tensor(1.9716, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0751, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.9044, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0730, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.3882, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0826, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.2555, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0735, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.7878, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0802, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.1000, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0807, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.3183, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0774, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.9662, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0762, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  24%|██▍       | 171/704 [00:01<00:03, 172.31it/s]

KL tensor(1.8040, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0866, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.8443, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0798, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.7718, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0770, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.5285, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0813, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.6760, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.7447, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0841, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.6703, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.5250, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0783, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  30%|██▉       | 210/704 [00:01<00:02, 181.17it/s]

KL tensor(1.3419, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0778, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.5503, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0759, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.8747, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0796, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.5411, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0850, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.3110, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0766, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.4736, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0792, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.5823, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0815, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.3385, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0808, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  35%|███▌      | 249/704 [00:01<00:02, 181.79it/s]

KL tensor(1.4185, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0762, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.2840, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0748, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.3241, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0770, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.4149, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0745, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.1493, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.3069, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0820, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.2449, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0782, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.3823, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0774, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  38%|███▊      | 268/704 [00:01<00:02, 180.90it/s]

KL tensor(1.1620, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0716, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.9691, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0714, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.9484, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0759, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.9491, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0789, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.1256, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0769, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.8130, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7921, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0741, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(1.1207, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0741, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  41%|████      | 287/704 [00:01<00:02, 180.44it/s]

KL tensor(0.7694, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0825, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7709, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0762, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6800, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0764, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7733, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0778, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7144, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0815, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.8592, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6635, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0770, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7847, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0743, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  43%|████▎     | 306/704 [00:01<00:02, 181.53it/s]

KL tensor(0.7219, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0755, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.8981, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0732, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.8486, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0757, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7085, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0689, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6359, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0740, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.9719, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0755, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.8162, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0785, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6206, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0729, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  46%|████▌     | 325/704 [00:01<00:02, 182.54it/s]

KL tensor(0.6380, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0729, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6251, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6818, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0698, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6059, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0722, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6186, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0776, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5795, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0745, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6533, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0707, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6615, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  49%|████▉     | 344/704 [00:01<00:02, 178.90it/s]

KL tensor(0.5321, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0714, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7413, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0727, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.7048, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0795, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5853, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0721, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4945, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0733, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5879, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0759, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.6347, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0688, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5130, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0724, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  52%|█████▏    | 363/704 [00:02<00:01, 179.20it/s]

KL tensor(0.4098, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0725, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5059, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0763, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5574, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0787, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4730, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0809, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3828, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0703, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4789, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0687, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.5442, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0750, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0731, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  54%|█████▍    | 381/704 [00:02<00:01, 174.32it/s]

KL tensor(0.4190, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0789, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4402, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0734, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4203, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0752, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3956, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3506, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4719, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0733, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4240, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0723, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3865, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0731, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  57%|█████▋    | 400/704 [00:02<00:01, 176.08it/s]

KL tensor(0.3033, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0804, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2923, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0792, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2991, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0712, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.4053, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3926, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0723, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2960, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0722, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3633, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0603, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3178, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0731, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  59%|█████▉    | 418/704 [00:02<00:01, 175.12it/s]

KL tensor(0.2928, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0683, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2713, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0769, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2999, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0723, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2968, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2403, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0765, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2262, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.3066, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0744, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2679, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  62%|██████▏   | 437/704 [00:02<00:01, 178.66it/s]

KL tensor(0.2319, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0723, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2634, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2359, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0746, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2293, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2661, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0736, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2611, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0708, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2630, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0714, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2126, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0704, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  65%|██████▍   | 456/704 [00:02<00:01, 181.60it/s]

KL tensor(0.2715, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0750, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2134, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0698, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2056, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0797, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.2258, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0783, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1938, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1813, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1686, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1894, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  67%|██████▋   | 475/704 [00:02<00:01, 174.01it/s]

KL tensor(0.1542, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1512, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0759, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1634, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1558, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0801, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1484, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1439, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1402, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0761, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1606, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  70%|███████   | 493/704 [00:02<00:01, 169.53it/s]

KL tensor(0.1721, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0747, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1548, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0724, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1273, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0711, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1430, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1510, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1681, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0757, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1187, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1410, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  75%|███████▌  | 529/704 [00:03<00:01, 168.85it/s]

KL tensor(0.1001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1162, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0712, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1024, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0864, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1036, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1178, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0683, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.1004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0882, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  80%|████████  | 565/704 [00:03<00:00, 172.14it/s]

KL tensor(0.0609, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0657, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0633, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0688, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0710, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0685, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0494, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0717, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0474, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0736, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0531, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0797, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0595, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  83%|████████▎ | 583/704 [00:03<00:00, 170.56it/s]

KL tensor(0.0352, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0332, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0374, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0681, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0369, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0351, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0273, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0329, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0360, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  85%|████████▌ | 601/704 [00:03<00:00, 166.58it/s]

KL tensor(0.0196, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0774, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0188, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0189, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0259, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0736, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0205, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0244, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0196, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0695, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0164, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0701, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  88%|████████▊ | 618/704 [00:03<00:00, 161.57it/s]

KL tensor(0.0211, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0191, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0708, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0180, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0167, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0717, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0163, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0182, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0163, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0760, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0161, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0708, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  90%|█████████ | 635/704 [00:03<00:00, 159.66it/s]

KL tensor(0.0144, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0137, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0701, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0131, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0135, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0719, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0130, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0117, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0709, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0142, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0121, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  92%|█████████▏| 651/704 [00:03<00:00, 151.38it/s]

KL tensor(0.0134, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0118, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0119, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0117, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0712, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0128, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0123, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0603, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0134, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0152, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Train]:  95%|█████████▍| 667/704 [00:03<00:00, 140.53it/s]

KL tensor(0.0087, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0691, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0093, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0092, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0093, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0685, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0079, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0097, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0097, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL 

Epoch 3 [Train]:  97%|█████████▋| 682/704 [00:04<00:00, 134.95it/s]

tensor(0.0077, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0080, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0101, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0092, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0692, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0072, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0086, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0094, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0086, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 3 [Train]: 100%|██████████| 704/704 [00:04<00:00, 164.76it/s]


KL tensor(0.0056, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0067, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0065, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0065, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0074, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0067, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0056, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0062, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0549, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 3 [Validation]:   0%|          | 0/79 [00:00<?, ?it/s]

KL tensor(0.0032, device='cuda:0')
REC tensor(0.0620, device='cuda:0')


Epoch 3 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 78.57it/s]

KL tensor(0.0020, device='cuda:0')
REC tensor(0.0651, device='cuda:0')
KL tensor(0.0030, device='cuda:0')
REC tensor(0.0607, device='cuda:0')
KL tensor(0.0024, device='cuda:0')
REC tensor(0.0554, device='cuda:0')
KL tensor(0.0024, device='cuda:0')
REC tensor(0.0607, device='cuda:0')
KL tensor(0.0029, device='cuda:0')
REC tensor(0.0587, device='cuda:0')
KL tensor(0.0036, device='cuda:0')
REC tensor(0.0687, device='cuda:0')
KL tensor(0.0037, device='cuda:0')
REC tensor(0.0689, device='cuda:0')





Validation loss improved from 0.1397 to 0.0003. Saving model...


Epoch 4 [Train]:   1%|          | 8/704 [00:00<00:09, 76.03it/s]

KL tensor(0.0059, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0061, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0069, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0053, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0700, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0052, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0539, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0046, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0052, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0050, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:   4%|▎         | 25/704 [00:00<00:05, 128.16it/s]

KL tensor(0.0054, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0706, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0052, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0558, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0050, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0667, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0050, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0543, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0042, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0041, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0047, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0050, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:   6%|▌         | 42/704 [00:00<00:04, 144.86it/s]

KL tensor(0.0037, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0557, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0033, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0037, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0035, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0706, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0043, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0034, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0037, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0691, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0035, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:   9%|▊         | 60/704 [00:00<00:04, 156.77it/s]

KL tensor(0.0035, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0040, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0036, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0551, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0032, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0039, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0031, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0036, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0033, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  11%|█         | 77/704 [00:00<00:03, 160.22it/s]

KL tensor(0.0028, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0027, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0034, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0029, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0029, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0031, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0031, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0030, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  13%|█▎        | 94/704 [00:00<00:03, 159.27it/s]

KL tensor(0.0028, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0025, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0025, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0025, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0026, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0029, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0024, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0028, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0541, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  16%|█▌        | 110/704 [00:00<00:03, 157.64it/s]

KL tensor(0.0025, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0020, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0708, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0024, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0692, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0024, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0021, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  18%|█▊        | 128/704 [00:00<00:03, 162.83it/s]

KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0020, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0684, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0021, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0021, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  21%|██        | 145/704 [00:00<00:03, 164.64it/s]

KL tensor(0.0019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0020, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0674, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0022, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0629, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0019, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0017, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0547, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0017, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  23%|██▎       | 163/704 [00:01<00:03, 167.05it/s]

tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0016, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0016, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0017, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0018, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0018, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0020, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0017, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0017, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 4 [Train]:  26%|██▌       | 180/704 [00:01<00:03, 165.37it/s]

KL tensor(0.0015, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0016, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0017, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0016, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0015, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  28%|██▊       | 198/704 [00:01<00:03, 168.45it/s]

KL tensor(0.0016, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0667, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0015, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0015, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0567, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0015, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0016, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  31%|███       | 215/704 [00:01<00:02, 168.53it/s]

KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0579, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  33%|███▎      | 232/704 [00:01<00:02, 166.63it/s]

KL tensor(0.0014, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0561, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0013, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0717, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  35%|███▌      | 249/704 [00:01<00:02, 167.43it/s]

KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0716, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0717, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0674, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  38%|███▊      | 266/704 [00:01<00:02, 167.55it/s]

KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0702, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0696, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0012, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0720, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0570, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  40%|████      | 283/704 [00:01<00:02, 165.80it/s]

KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0011, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0685, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  43%|████▎     | 301/704 [00:01<00:02, 169.26it/s]

KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0681, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0719, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0010, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  45%|████▌     | 319/704 [00:01<00:02, 170.85it/s]

tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0734, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 4 [Train]:  48%|████▊     | 337/704 [00:02<00:02, 172.33it/s]

KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0702, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0009, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  53%|█████▎    | 372/704 [00:02<00:01, 167.71it/s]

KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0695, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0701, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  58%|█████▊    | 407/704 [00:02<00:01, 168.22it/s]

KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0580, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0698, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0008, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  63%|██████▎   | 442/704 [00:02<00:01, 170.64it/s]

KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0687, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0544, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0007, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  68%|██████▊   | 479/704 [00:02<00:01, 175.86it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  73%|███████▎  | 515/704 [00:03<00:01, 174.73it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0006, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0587, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  76%|███████▌  | 533/704 [00:03<00:00, 174.72it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  78%|███████▊  | 551/704 [00:03<00:00, 166.89it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0704, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0555, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0545, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  81%|████████  | 568/704 [00:03<00:00, 167.38it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0694, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  83%|████████▎ | 585/704 [00:03<00:00, 166.16it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0566, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  86%|████████▌ | 602/704 [00:03<00:00, 165.70it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0573, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0629, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0564, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  88%|████████▊ | 620/704 [00:03<00:00, 168.53it/s]

tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0693, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0693, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0565, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0552, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 4 [Train]:  90%|█████████ | 637/704 [00:03<00:00, 167.45it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0565, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0518, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  93%|█████████▎| 654/704 [00:03<00:00, 167.03it/s]

KL tensor(0.0005, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0687, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  95%|█████████▌| 671/704 [00:04<00:00, 163.45it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0579, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0561, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0695, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0593, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0549, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]:  98%|█████████▊| 688/704 [00:04<00:00, 161.73it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0556, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 4 [Train]: 100%|██████████| 704/704 [00:04<00:00, 164.61it/s]


KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(8.0049e-05, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 4 [Validation]:   0%|          | 0/79 [00:00<?, ?it/s]

KL tensor(0.0004, device='cuda:0')
REC tensor(0.0620, device='cuda:0')
KL tensor(0.0004, device='cuda:0')
REC tensor(0.0651, device='cuda:0')
KL tensor(0.0004, device='cuda:0')
REC tensor(0.0605, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0551, device='cuda:0')
KL 

Epoch 4 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 88.32it/s]


tensor(0.0003, device='cuda:0')
REC tensor(0.0608, device='cuda:0')
KL tensor(0.0004, device='cuda:0')
REC tensor(0.0587, device='cuda:0')
KL tensor(0.0004, device='cuda:0')
REC tensor(0.0685, device='cuda:0')
KL tensor(0.0004, device='cuda:0')
REC tensor(0.0687, device='cuda:0')
Validation loss improved from 0.0003 to 0.0000. Saving model...


Epoch 5 [Train]:   1%|▏         | 10/704 [00:00<00:07, 98.75it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0539, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0708, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:   4%|▍         | 27/704 [00:00<00:04, 139.00it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0550, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0564, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0683, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0699, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:   6%|▌         | 43/704 [00:00<00:04, 146.96it/s]

tensor(0.0540, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0566, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0700, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 5 [Train]:   8%|▊         | 58/704 [00:00<00:04, 145.43it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0565, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  11%|█         | 76/704 [00:00<00:04, 155.76it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0593, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0548, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  13%|█▎        | 92/704 [00:00<00:03, 155.13it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0724, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  16%|█▌        | 110/704 [00:00<00:03, 162.10it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0667, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  18%|█▊        | 128/704 [00:00<00:03, 165.69it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  21%|██        | 146/704 [00:00<00:03, 168.36it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0735, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  23%|██▎       | 164/704 [00:01<00:03, 169.92it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0629, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0580, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  26%|██▌       | 181/704 [00:01<00:03, 164.24it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0718, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0557, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0688, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0711, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  28%|██▊       | 199/704 [00:01<00:02, 168.44it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0561, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0579, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  31%|███       | 217/704 [00:01<00:02, 169.56it/s]

KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  33%|███▎      | 235/704 [00:01<00:02, 172.33it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0713, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  36%|███▌      | 253/704 [00:01<00:02, 162.67it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0565, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0587, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0004, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0707, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  38%|███▊      | 270/704 [00:01<00:02, 162.62it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0698, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  41%|████      | 287/704 [00:01<00:02, 159.81it/s]

tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0642, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0688, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 5 [Train]:  43%|████▎     | 304/704 [00:01<00:02, 157.58it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0580, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  46%|████▌     | 322/704 [00:02<00:02, 161.40it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  48%|████▊     | 339/704 [00:02<00:02, 163.40it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  51%|█████     | 356/704 [00:02<00:02, 164.27it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0564, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0570, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  53%|█████▎    | 373/704 [00:02<00:01, 165.72it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0714, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0642, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0554, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0746, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0593, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  55%|█████▌    | 390/704 [00:02<00:01, 162.47it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0556, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0558, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0757, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0688, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  58%|█████▊    | 408/704 [00:02<00:01, 165.05it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0694, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  61%|██████    | 426/704 [00:02<00:01, 167.18it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0665, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0579, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  63%|██████▎   | 443/704 [00:02<00:01, 166.85it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0704, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  65%|██████▌   | 460/704 [00:02<00:01, 165.41it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0569, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0674, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0642, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  68%|██████▊   | 477/704 [00:02<00:01, 161.46it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0753, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0565, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  70%|███████   | 494/704 [00:03<00:01, 158.91it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  73%|███████▎  | 511/704 [00:03<00:01, 161.89it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0729, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  75%|███████▌  | 529/704 [00:03<00:01, 165.66it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0716, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0683, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  78%|███████▊  | 547/704 [00:03<00:00, 168.39it/s]

tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0544, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0717, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 5 [Train]:  80%|████████  | 564/704 [00:03<00:00, 165.52it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  83%|████████▎ | 581/704 [00:03<00:00, 163.61it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0524, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0567, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  85%|████████▍ | 598/704 [00:03<00:00, 162.97it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0555, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  87%|████████▋ | 615/704 [00:03<00:00, 162.65it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0560, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  90%|████████▉ | 633/704 [00:03<00:00, 167.27it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0559, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0672, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  95%|█████████▍| 668/704 [00:04<00:00, 166.08it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0683, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0569, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0747, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]:  97%|█████████▋| 685/704 [00:04<00:00, 166.19it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 5 [Train]: 100%|██████████| 704/704 [00:04<00:00, 161.96it/s]


KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(4.1634e-05, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0942, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 5 [Validation]:   0%|          | 0/79 [00:00<?, ?it/s]

KL tensor(0.0003, device='cuda:0')
REC tensor(0.0620, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0652, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0604, device='cuda:0')


Epoch 5 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 80.65it/s]


KL tensor(0.0003, device='cuda:0')
REC tensor(0.0550, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0607, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0587, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0683, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0685, device='cuda:0')
Validation loss improved from 0.0000 to 0.0000. Saving model...


Epoch 6 [Train]:   1%|          | 8/704 [00:00<00:08, 79.04it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0556, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0559, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:   4%|▎         | 26/704 [00:00<00:04, 136.05it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0553, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:   6%|▌         | 40/704 [00:00<00:04, 137.48it/s]

tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 6 [Train]:   8%|▊         | 56/704 [00:00<00:04, 146.28it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0573, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0674, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0587, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  11%|█         | 74/704 [00:00<00:04, 155.79it/s]

tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 6 [Train]:  13%|█▎        | 90/704 [00:00<00:03, 153.60it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0526, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0603, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0567, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0561, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  15%|█▌        | 106/704 [00:00<00:03, 155.63it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0570, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0544, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  17%|█▋        | 123/704 [00:00<00:03, 157.74it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0559, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  20%|█▉        | 140/704 [00:00<00:03, 159.12it/s]

tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 6 [Train]:  22%|██▏       | 156/704 [00:01<00:03, 154.16it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0542, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0697, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0628, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  27%|██▋       | 190/704 [00:01<00:03, 160.45it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0564, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  29%|██▉       | 207/704 [00:01<00:03, 162.42it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0572, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0684, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  32%|███▏      | 224/704 [00:01<00:02, 164.02it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0561, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0535, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0555, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  34%|███▍      | 241/704 [00:01<00:02, 165.31it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0513, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0536, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  37%|███▋      | 259/704 [00:01<00:02, 167.66it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0681, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0502, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0589, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0629, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  42%|████▏     | 293/704 [00:01<00:02, 164.62it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  46%|████▋     | 327/704 [00:02<00:02, 167.21it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  52%|█████▏    | 363/704 [00:02<00:02, 170.31it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0629, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0642, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0718, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0720, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  57%|█████▋    | 399/704 [00:02<00:01, 171.09it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0536, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  59%|█████▉    | 417/704 [00:02<00:01, 166.05it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0603, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  62%|██████▏   | 436/704 [00:02<00:01, 170.44it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0681, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  64%|██████▍   | 454/704 [00:02<00:01, 166.89it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0629, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0500, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  67%|██████▋   | 471/704 [00:02<00:01, 160.49it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0642, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  69%|██████▉   | 488/704 [00:03<00:01, 161.25it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0726, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0667, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  72%|███████▏  | 505/704 [00:03<00:01, 152.90it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0681, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0570, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0548, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  74%|███████▍  | 523/704 [00:03<00:01, 159.71it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  77%|███████▋  | 540/704 [00:03<00:01, 157.52it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0723, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0705, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  79%|███████▉  | 557/704 [00:03<00:00, 159.01it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0582, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0691, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  84%|████████▍ | 591/704 [00:03<00:00, 160.41it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0517, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  89%|████████▉ | 626/704 [00:03<00:00, 165.03it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0729, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0713, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0567, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  94%|█████████▍| 661/704 [00:04<00:00, 167.43it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0667, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]:  99%|█████████▉| 697/704 [00:04<00:00, 171.04it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0573, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0693, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 6 [Train]: 100%|██████████| 704/704 [00:04<00:00, 160.99it/s]


KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0587, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0694, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(3.0726e-05, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0565, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 6 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 85.67it/s]


KL tensor(0.0003, device='cuda:0')
REC tensor(0.0619, device='cuda:0')
KL tensor(0.0002, device='cuda:0')
REC tensor(0.0650, device='cuda:0')
KL tensor(0.0002, device='cuda:0')
REC tensor(0.0604, device='cuda:0')
KL tensor(0.0002, device='cuda:0')
REC tensor(0.0549, device='cuda:0')
KL tensor(0.0002, device='cuda:0')
REC tensor(0.0606, device='cuda:0')
KL tensor(0.0002, device='cuda:0')
REC tensor(0.0584, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0682, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0683, device='cuda:0')
Validation loss improved from 0.0000 to 0.0000. Saving model...


Epoch 7 [Train]:   1%|          | 7/704 [00:00<00:10, 68.00it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0587, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0661, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:   4%|▎         | 25/704 [00:00<00:05, 131.48it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0580, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:   6%|▌         | 42/704 [00:00<00:04, 146.35it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0554, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:   8%|▊         | 58/704 [00:00<00:04, 149.81it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0643, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0712, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0619, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  11%|█         | 75/704 [00:00<00:04, 155.96it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0575, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0675, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0667, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0703, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  13%|█▎        | 93/704 [00:00<00:03, 162.60it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0596, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0543, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  16%|█▌        | 110/704 [00:00<00:03, 163.41it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0589, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0573, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0677, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0600, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  18%|█▊        | 128/704 [00:00<00:03, 168.29it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0624, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0550, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  21%|██        | 145/704 [00:00<00:03, 166.14it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0557, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0550, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 7 [Train]:  23%|██▎       | 163/704 [00:01<00:03, 167.87it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0650, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0689, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0537, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  28%|██▊       | 198/704 [00:01<00:02, 169.84it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0593, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0654, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0690, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  33%|███▎      | 233/704 [00:01<00:02, 171.25it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0546, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  38%|███▊      | 269/704 [00:01<00:02, 161.56it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0573, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0566, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0691, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0657, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0612, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0762, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  43%|████▎     | 304/704 [00:01<00:02, 163.28it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0587, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0679, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0714, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0670, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0607, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  48%|████▊     | 338/704 [00:02<00:02, 166.50it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0634, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0574, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0687, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  53%|█████▎    | 372/704 [00:02<00:02, 165.66it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0581, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0623, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  55%|█████▌    | 389/704 [00:02<00:01, 165.04it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0724, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0683, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0684, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  58%|█████▊    | 406/704 [00:02<00:01, 160.96it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0494, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0644, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  60%|██████    | 423/704 [00:02<00:01, 160.10it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0563, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0518, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0665, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  63%|██████▎   | 441/704 [00:02<00:01, 164.44it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0739, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  65%|██████▌   | 458/704 [00:02<00:01, 163.47it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0660, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0719, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  67%|██████▋   | 475/704 [00:02<00:01, 156.82it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0651, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0567, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0566, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  70%|███████   | 494/704 [00:03<00:01, 164.66it/s]

tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0678, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0580, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0611, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 7 [Train]:  73%|███████▎  | 511/704 [00:03<00:01, 163.23it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0652, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0641, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  75%|███████▌  | 530/704 [00:03<00:01, 169.69it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0603, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0626, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0527, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0558, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0668, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  80%|████████  | 566/704 [00:03<00:00, 165.17it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0586, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0562, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0547, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  85%|████████▌ | 601/704 [00:03<00:00, 166.67it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0553, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0689, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0622, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0689, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  90%|█████████ | 635/704 [00:03<00:00, 165.55it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0584, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0696, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0714, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0674, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0530, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0642, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0613, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  95%|█████████▌| 669/704 [00:04<00:00, 156.96it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0665, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0583, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0685, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0534, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 7 [Train]:  97%|█████████▋| 685/704 [00:04<00:00, 153.37it/s]

tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0604, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0696, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0663, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0598, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 7 [Train]: 100%|██████████| 704/704 [00:04<00:00, 161.33it/s]


tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0603, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(2.7567e-05, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0959, device='cuda:0', grad_fn=<MseLossBackward0>)


Epoch 7 [Validation]:   9%|▉         | 7/79 [00:00<00:00, 83.20it/s]

KL tensor(0.0003, device='cuda:0')
REC tensor(0.0618, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0649, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0603, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0549, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0604, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0583, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0681, device='cuda:0')
KL tensor(0.0003, device='cuda:0')
REC tensor(0.0683, device='cuda:0')



Epoch 8 [Train]:   4%|▍         | 27/704 [00:00<00:04, 137.05it/s]

KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0662, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0003, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0614, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0595, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:   9%|▉         | 62/704 [00:00<00:04, 158.72it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0647, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0576, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0615, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0549, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0592, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0694, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  14%|█▍        | 98/704 [00:00<00:03, 169.60it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0656, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0658, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0630, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0640, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  19%|█▉        | 132/704 [00:00<00:03, 162.57it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0585, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0599, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0645, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0648, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  24%|██▍       | 168/704 [00:01<00:03, 168.53it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0698, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0580, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0542, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0560, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0556, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0620, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0588, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  29%|██▉       | 203/704 [00:01<00:02, 168.59it/s]

tensor(0.0673, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0659, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0593, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0597, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0569, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0

Epoch 8 [Train]:  31%|███▏      | 220/704 [00:01<00:02, 164.67it/s]

KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0669, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0571, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0625, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  36%|███▌      | 254/704 [00:01<00:02, 159.44it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0653, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0676, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0681, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0593, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0608, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0610, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0570, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  41%|████      | 289/704 [00:01<00:02, 163.20it/s]

tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0616, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0591, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0566, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0547, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0573, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0555, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 8 [Train]:  46%|████▌     | 324/704 [00:01<00:02, 165.96it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0633, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0568, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0617, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0631, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0577, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0569, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0601, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  51%|█████     | 359/704 [00:02<00:02, 167.34it/s]

tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0548, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0636, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0709, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0

Epoch 8 [Train]:  56%|█████▌    | 393/704 [00:02<00:01, 162.93it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0545, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0621, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0632, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0605, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0637, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0638, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0682, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0686, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  61%|██████    | 428/704 [00:02<00:01, 168.13it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0666, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0590, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0594, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0555, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0664, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0602, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  66%|██████▌   | 464/704 [00:02<00:01, 172.00it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0750, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0566, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0609, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0001, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0671, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0618, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0578, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0627, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso

Epoch 8 [Train]:  72%|███████▏  | 504/704 [00:03<00:01, 163.89it/s]

KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0649, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0639, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0635, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0646, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0655, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0680, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tensor(0.0002, device='cuda:0', grad_fn=<MeanBackward1>)
REC tensor(0.0606, device='cuda:0', grad_fn=<MseLossBackward0>)
KL tenso




KeyboardInterrupt: 

In [None]:
# First cell - Initialize model and load checkpoint
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# The architecture has to match the model that wrote the checkpoint: the training
# cell builds VAE(latent_dim=1024) and saves it to best_checkpoint_path, so a
# different latent size here would be expected to make load_state_dict raise on
# mismatched parameter shapes.
model = VAE(latent_dim=1024).to(device)
# map_location remaps the stored tensors onto `device`, so a checkpoint written
# on a GPU can still be loaded on a CPU-only machine.
checkpoint = torch.load(best_checkpoint_path, map_location=device)
# NOTE(review): assumes save_checkpoint stores a bare state_dict - confirm in train.py.
model.load_state_dict(checkpoint)
# Switch to evaluation mode; the trailing ';' hides the module repr in the cell output.
model.eval();

In [None]:
# Second cell - Get test images
# Gather the first 2000 images yielded by test_loader (labels are discarded);
# they are the reference set passed to the FID metric in a later cell.
num_test_images = 2000
test_batches = []
num_collected = 0
for batch, _ in test_loader:
    test_batches.append(batch)
    # Keep a running count rather than re-concatenating every batch gathered so
    # far just to measure its length, which copied all collected data each step.
    num_collected += len(batch)
    if num_collected >= num_test_images:
        break
# The last batch may overshoot the target, so trim to exactly num_test_images.
test_images = torch.cat(test_batches)[:num_test_images]

In [None]:
# Third cell - Generate images
batch_size = 64
num_to_generate = 2000

# Per-call sample counts: full batches of `batch_size`, with the final one
# trimmed so the total comes to exactly `num_to_generate`.
chunk_sizes = [
    min(batch_size, num_to_generate - offset)
    for offset in range(0, num_to_generate, batch_size)
]

# Generation runs with autograd disabled.
with torch.no_grad():
    generated_batches = [model.generate(size, device=device) for size in chunk_sizes]

generated_images = torch.cat(generated_batches)

In [None]:
# Fourth cell - Compute FID
# Build a fresh FIDMetric on `device` and score the generated images against
# the images collected from test_loader.
# NOTE(review): test_images come straight from the DataLoader while
# generated_images come from model.generate(..., device=device) - presumably
# FIDMetric moves both onto `device` internally; confirm in metrics.py.
metric = FIDMetric(device)
fid_score = metric(test_images, generated_images)
# fid_score is reused in the title of the visualization cell below.
print(f"FID Score: {fid_score:.2f}")

In [None]:
# Fifth cell - Visualize 16 random samples
import random
from torchvision.utils import make_grid
import matplotlib.pyplot as plt

# Pick 16 distinct sample positions at random (unseeded, so the selection
# changes from run to run).
indices = random.sample(range(len(generated_images)), 16)
vis_samples = generated_images[indices]

# Tile the samples four per row, then move the grid to the CPU and reorder its
# axes from (C, H, W) to (H, W, C), the layout imshow expects.
grid = make_grid(vis_samples, nrow=4, padding=2, normalize=True)
grid_hwc = grid.cpu().permute(1, 2, 0).numpy()

# Draw on an explicit figure/axes pair instead of the implicit pyplot state.
fig, ax = plt.subplots(figsize=(6, 6))
ax.imshow(grid_hwc)
ax.axis('off')
ax.set_title(f'Random Generated Samples (FID: {fid_score:.2f})')
plt.show()