In [5]:
import os
import glob
import random
import subprocess

import numpy as np
import pandas as pd
import h5py
import uproot
import awkward as ak

import torch
import torch.nn as nn
import torch.nn.functional as F
from torch_geometric.data import Data, Dataset, DataLoader
from torch_geometric.nn import knn_graph

import tqdm
from tqdm import tqdm

import os
import os.path as osp  # This defines 'osp'
import glob



def find_highest_branch(path, base_name):
    """Return the key of the highest-cycle object named ``base_name`` in a ROOT file.

    Keys are matched on the exact prefix ``"<base_name>;"`` so that names which
    merely start with ``base_name`` are not picked up.

    Args:
        path: Path of the ROOT file, passed to ``uproot.open``.
        base_name: Object name without the ``;<cycle>`` suffix.

    Returns:
        The matching key (``"<base_name>;<cycle>"``) with the largest integer
        cycle, or ``None`` when no key matches.
    """
    prefix = base_name + ';'
    with uproot.open(path) as root_file:
        candidates = [key for key in root_file.keys() if key.startswith(prefix)]

    best_key = None
    best_cycle = None
    for key in candidates:
        cycle = int(key.split(';')[-1])
        # ">=" keeps the last of any equal cycles, as a stable sort + [-1] would.
        if best_key is None or cycle >= best_cycle:
            best_key, best_cycle = key, cycle
    return best_key

class CCV1(Dataset):
    r'''
    Loads trackster-level features and reco-to-sim associations from ROOT files.

    Every event that survives the skim (at least two entries in
    ``simtrackstersCP/barycenter_x`` and at least two entries in
    ``tsCLUE3D_recoToSim_CP``) becomes one graph returned by :meth:`get`.

    The per-event awkward arrays are kept as attributes (``time``,
    ``raw_energy``, ``bx``, ``by``, ``bz``, ``beta``, ``bphi``, ``EV1``..``EV3``,
    ``eV0x``..``eV0z``, ``sigma1``..``sigma3``, ``pt``, ``vt``, ``assoc``,
    ``score``).
    '''

    url = '/dummy/'

    # Branch name in the tracksters tree -> attribute name on the dataset.
    _TRACKSTER_BRANCHES = {
        "time": "time",
        "raw_energy": "raw_energy",
        "barycenter_x": "bx",
        "barycenter_y": "by",
        "barycenter_z": "bz",
        "barycenter_eta": "beta",
        "barycenter_phi": "bphi",
        "EV1": "EV1",
        "EV2": "EV2",
        "EV3": "EV3",
        "eVector0_x": "eV0x",
        "eVector0_y": "eV0y",
        "eVector0_z": "eV0z",
        "sigmaPCA1": "sigma1",
        "sigmaPCA2": "sigma2",
        "sigmaPCA3": "sigma3",
        "raw_pt": "pt",
        "vertices_time": "vt",
    }

    # Branch name in the associations tree -> attribute name on the dataset.
    _ASSOC_BRANCHES = {
        "tsCLUE3D_recoToSim_CP": "assoc",
        "tsCLUE3D_recoToSim_CP_score": "score",
    }

    # Column order of the node-feature matrix ``x`` built in :meth:`get`.
    _FEATURE_ATTRS = (
        "bx", "by", "bz", "raw_energy",
        "beta", "bphi",
        "EV1", "EV2", "EV3",
        "eV0x", "eV0y", "eV0z",
        "sigma1", "sigma2", "sigma3",
        "pt",
    )

    # Width that the association / score matrices are truncated or padded to.
    _N_ASSOC_COLS = 4

    def __init__(self, root, transform=None, max_events=1e8, inp='train'):
        """
        Args:
            root: Dataset root directory; ``*.root`` files are looked up in
                ``self.raw_dir``.
            transform: Optional transform forwarded to the base ``Dataset``.
            max_events: Loading stops after the chunk in which the number of
                kept events reaches this value (so slightly more may be kept).
            inp: Free-form tag stored on the instance (e.g. ``'train'``/``'val'``).
        """
        super(CCV1, self).__init__(root, transform)
        self.inp = inp
        self.max_events = max_events
        self.fill_data(max_events)

    def fill_data(self, max_events):
        """Read all raw files chunk by chunk, skim the events and store them.

        For every chunk of the tracksters tree, the *same entry range* is read
        from the associations and simtrackstersCP trees so that the skim mask
        and the stored arrays always refer to the same events.
        """
        counter = 0
        print("### Loading tracksters data")

        attr_names = list(self._TRACKSTER_BRANCHES.values()) + list(self._ASSOC_BRANCHES.values())
        # Collect the pieces and concatenate once at the end instead of
        # re-concatenating (and re-copying) every array for every chunk.
        pieces = {attr: [] for attr in attr_names}

        for path in tqdm(self.raw_paths):
            print(path)

            tree_keys = {
                'tracksters': find_highest_branch(path, 'tracksters'),
                'associations': find_highest_branch(path, 'associations'),
                'simtrackstersCP': find_highest_branch(path, 'simtrackstersCP'),
            }
            for tree_name, key in tree_keys.items():
                if key is None:
                    raise KeyError(f"No '{tree_name}' tree found in {path}")

            with uproot.open(path) as root_file:
                tracksters_tree = root_file[tree_keys['tracksters']]
                assoc_tree = root_file[tree_keys['associations']]
                simtrack_tree = root_file[tree_keys['simtrackstersCP']]

                # report=True also yields the entry range covered by the chunk.
                for array, report in tracksters_tree.iterate(
                    list(self._TRACKSTER_BRANCHES), report=True
                ):
                    start = report.tree_entry_start
                    stop = report.tree_entry_stop

                    sim_bx = simtrack_tree.arrays(
                        ["barycenter_x"], entry_start=start, entry_stop=stop
                    )["barycenter_x"]
                    assoc_chunk = assoc_tree.arrays(
                        list(self._ASSOC_BRANCHES), entry_start=start, entry_stop=stop
                    )

                    # Keep events with >= 2 entries in both the sim barycenter
                    # list and the reco-to-sim association list.
                    keep = (ak.num(sim_bx, axis=1) >= 2) & (
                        ak.num(assoc_chunk["tsCLUE3D_recoToSim_CP"], axis=1) >= 2
                    )

                    for branch, attr in self._TRACKSTER_BRANCHES.items():
                        pieces[attr].append(array[branch][keep])
                    for branch, attr in self._ASSOC_BRANCHES.items():
                        pieces[attr].append(assoc_chunk[branch][keep])

                    counter += int(ak.sum(keep))
                    if counter >= max_events:
                        print(f"Reached {max_events} events!")
                        break
            if counter >= max_events:
                break

        for attr, parts in pieces.items():
            # With no input at all, fall back to an empty array so len() is 0.
            setattr(self, attr, ak.concatenate(parts) if parts else ak.Array([]))

    def download(self):
        raise RuntimeError(
            f'Dataset not found. Please download it from {self.url} and move all '
            f'*.root files to {self.raw_dir}')

    def len(self):
        """Number of events kept after skimming."""
        return len(self.time)

    @property
    def raw_file_names(self):
        """Sorted list of all ``*.root`` files found in ``self.raw_dir``."""
        raw_files = sorted(glob.glob(osp.join(self.raw_dir, '*.root')))
        return raw_files

    @property
    def processed_file_names(self):
        """No processed files are written; everything is kept in memory."""
        return []

    @staticmethod
    def _ensure_four_columns(tensor):
        """
        Truncate or pad ``tensor`` to exactly four columns.

        If tensor.shape[1] > 4, keep the first 4 columns.
        If tensor.shape[1] < 4, repeat the last column until there are 4.
        A 1-D tensor of shape (N,) is treated as (N, 1).
        """
        width = CCV1._N_ASSOC_COLS
        if tensor.ndim == 1:
            tensor = tensor.unsqueeze(1)

        ncol = tensor.shape[1]
        if ncol > width:
            tensor = tensor[:, :width]
        elif ncol < width:
            last_col = tensor[:, -1].unsqueeze(1)          # shape (N, 1)
            padding = last_col.repeat(1, width - ncol)     # shape (N, width - ncol)
            tensor = torch.cat([tensor, padding], dim=1)   # shape (N, width)
        return tensor

    def get(self, idx):
        """Build the graph for event ``idx``.

        Returns:
            ``Data`` with
              * ``x``: float tensor (N, 16), columns ordered as ``_FEATURE_ATTRS``;
              * ``assoc``: Python list of N ints, for each trackster the entry of
                ``links`` whose score is smallest;
              * ``scores``: float tensor (N, 4) of association scores;
              * ``links``: float tensor (N, 4) of associated indices.
        """
        feature_columns = [np.array(getattr(self, attr)[idx]) for attr in self._FEATURE_ATTRS]
        x = torch.from_numpy(np.column_stack(feature_columns)).float()

        # The per-event association / score arrays are converted as regular
        # 2-D arrays, exactly as before (one row per trackster).
        links_tensor = torch.from_numpy(np.array(self.assoc[idx])).float()
        scores_tensor = torch.from_numpy(np.array(self.score[idx])).float()

        scores_tensor = self._ensure_four_columns(scores_tensor)
        links_tensor = self._ensure_four_columns(links_tensor)

        # For every trackster pick the link with the smallest score.
        best_col = torch.argmin(scores_tensor, dim=1, keepdim=True)
        assoc_array = links_tensor.gather(1, best_col).squeeze(1).long().tolist()

        return Data(
            x=x,
            assoc=assoc_array,
            scores=scores_tensor,
            links=links_tensor
        )


In [None]:
# Root directories of the training / validation samples; CCV1 globs the
# '*.root' files from the dataset's raw directory under each root.
ipath = "/vols/cms/mm1221/Data/mix/train/"
vpath = "/vols/cms/mm1221/Data/mix/val/"
# NOTE: max_events is only checked after each loaded chunk, so the datasets can
# end up with more events than the number given here.
data_train = CCV1(ipath, max_events=10000, inp='train')
data_val = CCV1(vpath, max_events=10, inp='val')

### Loading tracksters data


  0%|                                                     | 0/3 [00:00<?, ?it/s]

/vols/cms/mm1221/Data/mix/train/raw/18k.root


In [139]:
def contrastive_loss_curriculum_both(embeddings, pos_indices, group_ids, temperature=0.5, alpha=1.0):
    """
    NT-Xent style loss with one positive and one (blended) negative per anchor.

    For each anchor i:
      - Positive similarity: pos_sim = sim(embeddings[i], embeddings[pos_indices[i]]).
        Only the provided positive is used; no hard-positive mining is applied.
      - Random negative similarity: rand_neg_sim = similarity to one uniformly
        chosen sample whose group id differs from the anchor's.
      - Hard negative similarity: hard_neg_sim = max { sim(embeddings[i], embeddings[j]) :
                                                      group_ids[j] != group_ids[i] }
      - Blended negative similarity:
            blended_neg = (1 - alpha) * rand_neg_sim + alpha * hard_neg_sim

    The loss per anchor is
         loss_i = -log( exp(pos_sim/T) / (exp(pos_sim/T) + exp(blended_neg/T)) )
                = softplus((blended_neg - pos_sim) / T)
    and is evaluated in the softplus form, which does not overflow for small T.

    Anchors without any valid negative contribute 0 (they are still counted in
    the mean).

    Args:
        embeddings: Tensor of shape (N, D) (raw outputs; normalised inside).
        pos_indices: 1D integer Tensor (length N), index of the positive for each anchor.
        group_ids: 1D Tensor (length N) of group identifiers.
        temperature: Temperature scaling factor T.
        alpha: Blend between random (0) and hard (1) negatives.

    Returns:
        Scalar loss (mean over anchors); 0 for an empty input.
    """
    num_anchors = embeddings.size(0)
    if num_anchors == 0:
        # Nothing to contrast; return a zero that is still attached to the graph.
        return embeddings.sum() * 0.0

    # Normalise so that cosine similarity is a plain dot product.
    norm_emb = F.normalize(embeddings, p=2, dim=1)  # shape (N, D)
    sim_matrix = norm_emb @ norm_emb.t()            # shape (N, N)
    idx = torch.arange(num_anchors, device=embeddings.device)

    # --- Positives ---
    pos_sim = sim_matrix[idx, pos_indices.view(-1).long()]

    # --- Negatives ---
    neg_mask = group_ids.unsqueeze(1) != group_ids.unsqueeze(0)
    no_valid_neg = ~neg_mask.any(dim=1)

    # Random negative: uniform scores in [0, 1) for negatives, -1 elsewhere, so
    # the row-wise argmax is a uniformly chosen negative.
    rand_vals = torch.rand(sim_matrix.shape, device=embeddings.device)
    rand_vals = rand_vals.masked_fill(~neg_mask, -1.0)
    rand_neg_sim = sim_matrix[idx, rand_vals.argmax(dim=1)]

    # Hard negative: most similar sample from a different group.
    hard_neg_sim = sim_matrix.masked_fill(~neg_mask, float('-inf')).max(dim=1).values
    # Rows without negatives are all -inf; use -1 so that alpha * value stays finite.
    hard_neg_sim = hard_neg_sim.masked_fill(no_valid_neg, -1.0)

    blended_neg = (1 - alpha) * rand_neg_sim + alpha * hard_neg_sim

    # --- Loss ---
    loss = F.softplus((blended_neg - pos_sim) / temperature)
    loss = loss.masked_fill(no_valid_neg, 0.0)

    return loss.mean()

def contrastive_loss_curriculum(embeddings, pos_indices, group_ids, temperature=0.1, alpha=1.0):
    """
    Curriculum contrastive loss; thin wrapper around
    contrastive_loss_curriculum_both with a default temperature of 0.1.

    The signature now matches the documented arguments and the way the
    training / validation loops call it. Previously ``pos_indices`` was missing
    and the remaining arguments were forwarded shifted by one position, so
    every call raised.

    Args:
        embeddings: Tensor of shape (N, D).
        pos_indices: 1D Tensor (length N), index of the positive for each anchor.
        group_ids: 1D Tensor (length N) of group identifiers.
        temperature: Temperature scaling factor.
        alpha: Blending parameter between random (0) and hard (1) negatives.

    Returns:
        Scalar loss.
    """
    return contrastive_loss_curriculum_both(
        embeddings,
        pos_indices,
        group_ids,
        temperature=temperature,
        alpha=alpha,
    )




#################################
# Training and Testing Functions
#################################

def train_new(train_loader, model, optimizer, device, k_value, alpha):
    """Run one training epoch.

    For every batch a kNN graph is built on the first three feature columns,
    the model is evaluated, and the contrastive loss is computed separately for
    each event in the batch and averaged over the events of that batch.

    Args:
        train_loader: Loader yielding batches with ``x``, ``x_batch``, ``assoc``
            and ``x_pe``.
        model: Network returning ``(embeddings, batch)``.
        optimizer: Optimizer stepped once per batch.
        device: Device the batch and the accumulators live on.
        k_value: Number of neighbours for ``knn_graph``.
        alpha: Hard-negative blending factor forwarded to the loss.

    Returns:
        Tensor of shape (1,): sum of the per-batch losses divided by the number
        of events in the dataset.
    """
    model.train()
    total_loss = torch.zeros(1, device=device)
    for data in tqdm(train_loader, desc="Training"):
        data = data.to(device)
        optimizer.zero_grad()

        # Convert data.assoc to a flat tensor of group ids if it is still a
        # (nested) Python list after collation.
        if isinstance(data.assoc, list):
            if isinstance(data.assoc[0], list):
                assoc_tensor = torch.cat([torch.tensor(a, dtype=torch.int64, device=data.x.device)
                                          for a in data.assoc])
            else:
                assoc_tensor = torch.tensor(data.assoc, device=data.x.device)
        else:
            assoc_tensor = data.assoc

        edge_index = knn_graph(data.x[:, :3], k=k_value, batch=data.x_batch)
        embeddings, _ = model(data.x, edge_index, data.x_batch)

        # Partition the batch by event: nodes of one event are contiguous.
        batch_np = data.x_batch.detach().cpu().numpy()
        _, counts = np.unique(batch_np, return_counts=True)

        loss_event_total = torch.zeros(1, device=device)
        start_idx = 0
        for count in counts:
            end_idx = start_idx + count
            event_embeddings = embeddings[start_idx:end_idx]
            event_group_ids = assoc_tensor[start_idx:end_idx]
            # NOTE(review): column 1 of data.x_pe is used as the positive index
            # of every node; CCV1.get in this notebook does not set x_pe, so
            # confirm that the dataset in use provides it.
            event_pos_indices = data.x_pe[start_idx:end_idx, 1].view(-1)
            loss_event = contrastive_loss_curriculum(event_embeddings, event_pos_indices,
                                                     event_group_ids, temperature=0.1, alpha=alpha)
            loss_event_total += loss_event
            start_idx = end_idx

        loss = loss_event_total / len(counts)
        loss.backward()
        optimizer.step()
        # Detach before accumulating so the running total does not carry the
        # autograd history of every batch of the epoch.
        total_loss += loss.detach()
    # NOTE(review): per-batch mean losses are divided by the number of events,
    # not the number of batches; kept as-is so logged values stay comparable.
    return total_loss / len(train_loader.dataset)

@torch.no_grad()
def test_new(test_loader, model, device, k_value, alpha):
    """Evaluate the contrastive loss over ``test_loader`` without gradients.

    Mirrors the training loop: kNN graph on the first three feature columns,
    model forward pass, then one loss per event averaged within each batch.

    Returns:
        Tensor of shape (1,): sum of the per-batch losses divided by the number
        of events in the dataset.
    """
    model.eval()
    running_loss = torch.zeros(1, device=device)

    for batch in tqdm(test_loader, desc="Validation"):
        batch = batch.to(device)

        # Flatten the group ids into one tensor when collation left them as lists.
        group_ids = batch.assoc
        if isinstance(group_ids, list):
            if isinstance(group_ids[0], list):
                per_event = [torch.tensor(ids, dtype=torch.int64, device=batch.x.device)
                             for ids in group_ids]
                group_ids = torch.cat(per_event)
            else:
                group_ids = torch.tensor(group_ids, device=batch.x.device)

        graph = knn_graph(batch.x[:, :3], k=k_value, batch=batch.x_batch)
        embeddings, _ = model(batch.x, graph, batch.x_batch)

        # Number of nodes per event; events occupy contiguous slices.
        _, event_sizes = np.unique(batch.x_batch.detach().cpu().numpy(), return_counts=True)

        batch_loss = torch.zeros(1, device=device)
        lo = 0
        for size in event_sizes:
            hi = lo + size
            # Column 1 of x_pe is passed as the positive index of each node.
            positives = batch.x_pe[lo:hi, 1].view(-1)
            batch_loss += contrastive_loss_curriculum(embeddings[lo:hi], positives,
                                                      group_ids[lo:hi], temperature=0.1, alpha=alpha)
            lo = hi

        running_loss += batch_loss / len(event_sizes)

    return running_loss / len(test_loader.dataset)


In [137]:
import torch
import torch.nn as nn
import torch.nn.functional as F

from torch_geometric.data import Data
from torch_geometric.nn import knn_graph



class CustomStaticEdgeConv(nn.Module):
    """Edge convolution on a fixed, precomputed graph with mean aggregation.

    For every edge ``(row, col)`` the message ``nn_module([x[row], x[col] - x[row]])``
    is computed and the messages are averaged over all edges sharing the same
    ``row`` node.
    """

    def __init__(self, nn_module):
        """
        Args:
            nn_module: Module applied to the concatenated edge features of
                shape (E, 2 * F).
        """
        super(CustomStaticEdgeConv, self).__init__()
        self.nn_module = nn_module

    def forward(self, x, edge_index):
        """
        Args:
            x (torch.Tensor): Node features of shape (N, F).
            edge_index (torch.Tensor): Predefined edges [2, E], where E is the number of edges.

        Returns:
            torch.Tensor: Node features after static edge aggregation; nodes
            that never appear in ``edge_index[0]`` get zeros.
        """
        # NOTE(review): messages are aggregated at edge_index[0]; confirm this
        # matches the edge direction convention of the graph builder in use.
        row, col = edge_index
        x_center = x[row]
        x_neighbor = x[col]

        # Edge features: centre node plus offset to the neighbour.
        edge_features = torch.cat([x_center, x_neighbor - x_center], dim=-1)
        edge_features = self.nn_module(edge_features)

        # Sum the messages per node. new_zeros takes dtype and device from the
        # messages, so the accumulation also works for non-float32 inputs.
        num_nodes = x.size(0)
        node_features = edge_features.new_zeros(num_nodes, edge_features.size(-1))
        node_features.index_add_(0, row, edge_features)

        # Turn the sum into a mean; clamp avoids division by zero for nodes
        # without any edge.
        counts = torch.bincount(row, minlength=num_nodes).clamp(min=1).view(-1, 1)
        node_features = node_features / counts

        return node_features

class Net(nn.Module):
    """Encoder -> stack of residual static edge convolutions -> projection head."""

    def __init__(self, hidden_dim=64, num_layers=4, dropout=0.3, contrastive_dim=8, heads=4, in_dim=16):
        """
        Args:
            hidden_dim (int): Dimension of hidden layers.
            num_layers (int): Number of CustomStaticEdgeConv layers.
            dropout (float): Dropout rate used in the conv blocks and the head.
            contrastive_dim (int): Dimension of the contrastive output.
            heads (int): Stored on the instance but not used by any layer;
                kept for backward compatibility.
            in_dim (int): Number of input features per node (default 16).
        """
        super(Net, self).__init__()
        self.hidden_dim = hidden_dim
        self.num_layers = num_layers
        self.dropout = dropout
        self.contrastive_dim = contrastive_dim
        self.heads = heads
        self.in_dim = in_dim

        # Input encoder
        self.lc_encode = nn.Sequential(
            nn.Linear(in_dim, hidden_dim),
            nn.ELU(),
            nn.Linear(hidden_dim, hidden_dim),
            nn.ELU()
        )

        # Edge-convolution stack; each block maps the (2 * hidden_dim) edge
        # features back to hidden_dim.
        self.convs = nn.ModuleList()
        for _ in range(num_layers):
            conv = CustomStaticEdgeConv(
                nn.Sequential(
                    nn.Linear(2 * hidden_dim, hidden_dim),
                    nn.ELU(),
                    nn.BatchNorm1d(hidden_dim),
                    nn.Dropout(p=dropout)
                )
            )
            self.convs.append(conv)

        # Output layer
        self.output = nn.Sequential(
            nn.Linear(hidden_dim, 64),
            nn.ELU(),
            nn.Dropout(p=dropout),
            nn.Linear(64, 32),
            nn.ELU(),
            nn.Dropout(p=dropout),
            nn.Linear(32, contrastive_dim)
        )

    def forward(self, x, edge_index, batch):
        """
        Forward pass of the network.

        Args:
            x (torch.Tensor): Input node features of shape (N, in_dim).
            edge_index (torch.Tensor): Edge indices of shape (2, E).
            batch (torch.Tensor): Batch vector; returned unchanged.

        Returns:
            torch.Tensor: Output embeddings of shape (N, contrastive_dim).
            torch.Tensor: The ``batch`` argument.
        """
        # Input encoding
        feats = self.lc_encode(x)  # Shape: (N, hidden_dim)

        # Convolutional layers with residual connections
        for conv in self.convs:
            feats = conv(feats, edge_index) + feats

        # Final output
        out = self.output(feats)
        return out, batch



In [138]:
print("Instantiating model...")
# Instantiate model.

# Set device.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
print("Loading data...")
model = Net(
    hidden_dim=128,
    num_layers=4,
    dropout=0.3,
    contrastive_dim=128
).to(device)

k_value = 24
BS = 12

# Setup optimizer and scheduler.
optimizer = torch.optim.Adam(model.parameters(), lr=0.001)
scheduler = torch.optim.lr_scheduler.StepLR(optimizer, step_size=100, gamma=0.5)

# Create DataLoaders. follow_batch=['x'] makes the loader add `x_batch`.
train_loader = DataLoader(data_train, batch_size=BS, shuffle=False, follow_batch=['x'])
val_loader = DataLoader(data_val, batch_size=BS, shuffle=False, follow_batch=['x'])

# Setup output directory.
output_dir = '/vols/cms/mm1221/hgcal/Mixed/Track/NegativeMining/runs/SEC/Allk4/'
os.makedirs(output_dir, exist_ok=True)
best_val_loss = float('inf')
train_losses = []
val_losses = []
patience = 300
no_improvement_epochs = 0

print("Starting full training with curriculum for hard negative mining...")

epochs = 300
for epoch in range(epochs):
    # Curriculum for the training alpha:
    #   epochs   1-75  : alpha = 0 (random negatives only)
    #   epochs  76-150 : alpha ramps linearly from 1/75 up to 1
    #   epochs 151+    : alpha = 1 (hard negatives only)
    # alpha2 (validation) switches from 0 to 1 once the ramp starts.
    if epoch < 75:
        alpha = 0.0
        alpha2 = 0.0
    elif epoch < 150:
        # Offset by the 75 warm-up epochs so the ramp stays within (0, 1];
        # (epoch + 1) / 75 would run from 1.01 to 2.0 here.
        alpha = (epoch - 75 + 1) / 75
        alpha2 = 1.0
    else:
        alpha = 1.0
        alpha2 = 1.0

    print(f"Epoch {epoch+1}/{epochs} | Alpha: {alpha:.2f}")
    train_loss = train_new(train_loader, model, optimizer, device, k_value, alpha)
    val_loss = test_new(val_loader, model, device, k_value, alpha2)

    train_loss_value = train_loss.item()
    val_loss_value = val_loss.item()
    train_losses.append(train_loss_value)
    val_losses.append(val_loss_value)
    scheduler.step()

    # Save best model if validation loss improves (compared as plain floats so
    # best_val_loss never holds on to a tensor).
    if val_loss_value < best_val_loss:
        best_val_loss = val_loss_value
        no_improvement_epochs = 0
        torch.save(model.state_dict(), os.path.join(output_dir, 'best_model.pt'))
    else:
        no_improvement_epochs += 1

    # Save intermediate checkpoint.
    state_dicts = {'model': model.state_dict(),
                   'opt': optimizer.state_dict(),
                   'lr': scheduler.state_dict()}
    torch.save(state_dicts, os.path.join(output_dir, f'epoch-{epoch+1}.pt'))

    print(f"Epoch {epoch+1}/{epochs} - Train Loss: {train_loss_value:.8f}, Validation Loss: {val_loss_value:.8f}")
    if no_improvement_epochs >= patience:
        print(f"Early stopping triggered. No improvement for {patience} epochs.")
        break

# Save training history.
results_df = pd.DataFrame({
    'epoch': list(range(1, len(train_losses) + 1)),
    'train_loss': train_losses,
    'val_loss': val_losses
})
results_df.to_csv(os.path.join(output_dir, 'continued_training_loss.csv'), index=False)
print(f"Saved loss curves to {os.path.join(output_dir, 'continued_training_loss.csv')}")

# Save final model.
torch.save(model.state_dict(), os.path.join(output_dir, 'final_model.pt'))
print("Training complete. Final model saved.")


Instantiating model...
Loading data...
Starting full training with curriculum for hard negative mining...
Epoch 1/300 | Alpha: 0.00


Training:   0%|                                                                                                                                                                    | 0/1352 [00:00<?, ?it/s]

neg 

Training:   0%|                                                                                                                                                            | 1/1352 [00:00<06:37,  3.40it/s]

tensor(0.7296, grad_fn=<MeanBackward0>)
pos tensor(0.4235, grad_fn=<MeanBackward0>)
neg tensor(0.7260, grad_fn=<MeanBackward0>)
pos tensor(0.5304, grad_fn=<MeanBackward0>)
neg tensor(0.7224, grad_fn=<MeanBackward0>)
pos tensor(0.5010, grad_fn=<MeanBackward0>)
neg tensor(0.6854, grad_fn=<MeanBackward0>)
pos tensor(0.6735, grad_fn=<MeanBackward0>)
neg tensor(0.6033, grad_fn=<MeanBackward0>)
pos tensor(0.6980, grad_fn=<MeanBackward0>)
neg tensor(0.7183, grad_fn=<MeanBackward0>)
pos tensor(0.5265, grad_fn=<MeanBackward0>)
neg tensor(0.5805, grad_fn=<MeanBackward0>)
pos tensor(0.5845, grad_fn=<MeanBackward0>)
neg tensor(0.7098, grad_fn=<MeanBackward0>)
pos tensor(0.5185, grad_fn=<MeanBackward0>)
neg tensor(0.6772, grad_fn=<MeanBackward0>)
pos tensor(0.4768, grad_fn=<MeanBackward0>)
neg tensor(0.7543, grad_fn=<MeanBackward0>)
pos tensor(0.5701, grad_fn=<MeanBackward0>)
neg tensor(0.7026, grad_fn=<MeanBackward0>)
pos tensor(0.4764, grad_fn=<MeanBackward0>)
neg tensor(0.7684, grad_fn=<MeanBack

Training:   0%|▏                                                                                                                                                           | 2/1352 [00:00<05:41,  3.96it/s]

neg tensor(0.7864, grad_fn=<MeanBackward0>)
pos tensor(0.5707, grad_fn=<MeanBackward0>)
neg tensor(0.7876, grad_fn=<MeanBackward0>)
pos tensor(0.7718, grad_fn=<MeanBackward0>)
neg tensor(0.6878, grad_fn=<MeanBackward0>)
pos tensor(0.6624, grad_fn=<MeanBackward0>)
neg tensor(0.8151, grad_fn=<MeanBackward0>)
pos tensor(0.5860, grad_fn=<MeanBackward0>)
neg tensor(0.6279, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.7548, grad_fn=<MeanBackward0>)
pos tensor(0.5670, grad_fn=<MeanBackward0>)
neg tensor(0.8388, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.7882, grad_fn=<MeanBackward0>)
pos tensor(0.6189, grad_fn=<MeanBackward0>)
neg tensor(0.7890, grad_fn=<MeanBackward0>)
pos tensor(0.6215, grad_fn=<MeanBackward0>)
neg tensor(0.6884, grad_fn=<MeanBackward0>)
pos tensor(0.6054, grad_fn=<MeanBackward0>)
neg tensor(0.7797, grad_fn=<MeanBackward0>)
pos tensor(0.5824, grad_fn=<MeanBackward0>)
neg tensor(0.7251, grad_fn=<MeanBack

Training:   0%|▎                                                                                                                                                           | 3/1352 [00:00<05:27,  4.12it/s]

neg tensor(0.7830, grad_fn=<MeanBackward0>)
pos tensor(0.6719, grad_fn=<MeanBackward0>)
neg tensor(0.6887, grad_fn=<MeanBackward0>)
pos tensor(0.6445, grad_fn=<MeanBackward0>)
neg tensor(0.7819, grad_fn=<MeanBackward0>)
pos tensor(0.6349, grad_fn=<MeanBackward0>)
neg tensor(0.7943, grad_fn=<MeanBackward0>)
pos tensor(0.6525, grad_fn=<MeanBackward0>)
neg tensor(0.7516, grad_fn=<MeanBackward0>)
pos tensor(0.7037, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(0.7213, grad_fn=<MeanBackward0>)
neg tensor(0.7870, grad_fn=<MeanBackward0>)
pos tensor(0.6818, grad_fn=<MeanBackward0>)
neg tensor(0.7996, grad_fn=<MeanBackward0>)
pos tensor(0.7045, grad_fn=<MeanBackward0>)
neg tensor(0.7973, grad_fn=<MeanBackward0>)
pos tensor(0.7129, grad_fn=<MeanBackward0>)
neg tensor(0.7751, grad_fn=<MeanBackward0>)
pos tensor(0.7577, grad_fn=<MeanBackward0>)
neg tensor(0.7890, grad_fn=<MeanBackward0>)
pos tensor(0.6357, grad_fn=<MeanBackward0>)
neg tensor(0.8465, grad_fn=<MeanBac

Training:   0%|▍                                                                                                                                                           | 4/1352 [00:01<05:46,  3.89it/s]

neg tensor(0.7953, grad_fn=<MeanBackward0>)
pos tensor(0.7410, grad_fn=<MeanBackward0>)
neg tensor(0.8334, grad_fn=<MeanBackward0>)
pos tensor(0.6574, grad_fn=<MeanBackward0>)
neg tensor(0.7540, grad_fn=<MeanBackward0>)
pos tensor(0.7204, grad_fn=<MeanBackward0>)
neg tensor(0.8341, grad_fn=<MeanBackward0>)
pos tensor(0.6826, grad_fn=<MeanBackward0>)
neg tensor(0.8383, grad_fn=<MeanBackward0>)
pos tensor(0.6344, grad_fn=<MeanBackward0>)
neg tensor(0.8469, grad_fn=<MeanBackward0>)
pos tensor(0.6936, grad_fn=<MeanBackward0>)
neg tensor(0.8438, grad_fn=<MeanBackward0>)
pos tensor(0.7469, grad_fn=<MeanBackward0>)
neg tensor(0.8387, grad_fn=<MeanBackward0>)
pos tensor(0.7434, grad_fn=<MeanBackward0>)
neg tensor(0.8287, grad_fn=<MeanBackward0>)
pos tensor(0.6958, grad_fn=<MeanBackward0>)
neg tensor(0.8155, grad_fn=<MeanBackward0>)
pos tensor(0.7311, grad_fn=<MeanBackward0>)
neg tensor(0.8534, grad_fn=<MeanBackward0>)
pos tensor(0.6525, grad_fn=<MeanBackward0>)
neg tensor(0.5950, grad_fn=<Mean

Training:   0%|▌                                                                                                                                                           | 5/1352 [00:01<05:09,  4.35it/s]

neg tensor(0.7802, grad_fn=<MeanBackward0>)
pos tensor(0.6640, grad_fn=<MeanBackward0>)
neg tensor(0.8238, grad_fn=<MeanBackward0>)
pos tensor(0.6724, grad_fn=<MeanBackward0>)
neg tensor(0.8037, grad_fn=<MeanBackward0>)
pos tensor(0.8117, grad_fn=<MeanBackward0>)
neg tensor(0.7677, grad_fn=<MeanBackward0>)
pos tensor(0.6898, grad_fn=<MeanBackward0>)
neg tensor(0.8433, grad_fn=<MeanBackward0>)
pos tensor(0.7305, grad_fn=<MeanBackward0>)
neg tensor(0.8185, grad_fn=<MeanBackward0>)
pos tensor(0.6829, grad_fn=<MeanBackward0>)
neg tensor(0.8315, grad_fn=<MeanBackward0>)
pos tensor(0.7291, grad_fn=<MeanBackward0>)
neg tensor(0.7244, grad_fn=<MeanBackward0>)
pos tensor(0.6146, grad_fn=<MeanBackward0>)
neg tensor(0.7993, grad_fn=<MeanBackward0>)
pos tensor(0.7987, grad_fn=<MeanBackward0>)
neg tensor(0.8058, grad_fn=<MeanBackward0>)
pos tensor(0.6308, grad_fn=<MeanBackward0>)
neg tensor(0.8181, grad_fn=<MeanBackward0>)
pos tensor(0.7392, grad_fn=<MeanBackward0>)
neg tensor(0.6843, grad_fn=<Mean

Training:   0%|▋                                                                                                                                                           | 6/1352 [00:01<04:58,  4.51it/s]

neg tensor(0.8651, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.6378, grad_fn=<MeanBackward0>)
pos tensor(0.8487, grad_fn=<MeanBackward0>)
neg tensor(0.8649, grad_fn=<MeanBackward0>)
pos tensor(0.7637, grad_fn=<MeanBackward0>)
neg tensor(0.8583, grad_fn=<MeanBackward0>)
pos tensor(0.6597, grad_fn=<MeanBackward0>)
neg tensor(0.8298, grad_fn=<MeanBackward0>)
pos tensor(0.6968, grad_fn=<MeanBackward0>)
neg tensor(0.8531, grad_fn=<MeanBackward0>)
pos tensor(0.7299, grad_fn=<MeanBackward0>)
neg tensor(0.7527, grad_fn=<MeanBackward0>)
pos tensor(0.7723, grad_fn=<MeanBackward0>)
neg tensor(0.7134, grad_fn=<MeanBackward0>)
pos tensor(0.6588, grad_fn=<MeanBackward0>)
neg tensor(0.8223, grad_fn=<MeanBackward0>)
pos tensor(0.7830, grad_fn=<MeanBackward0>)
neg tensor(0.7604, grad_fn=<MeanBackward0>)
pos tensor(0.7989, grad_fn=<MeanBackward0>)
neg tensor(0.8100, grad_fn=<MeanBackward0>)
pos tensor(0.7232, grad_fn=<MeanBackward0>)


Training:   1%|▊                                                                                                                                                           | 7/1352 [00:01<05:11,  4.31it/s]

neg tensor(0.8302, grad_fn=<MeanBackward0>)
pos tensor(0.8467, grad_fn=<MeanBackward0>)
neg tensor(0.8678, grad_fn=<MeanBackward0>)
pos tensor(0.7078, grad_fn=<MeanBackward0>)
neg tensor(0.8527, grad_fn=<MeanBackward0>)
pos tensor(0.7129, grad_fn=<MeanBackward0>)
neg tensor(0.8538, grad_fn=<MeanBackward0>)
pos tensor(0.6952, grad_fn=<MeanBackward0>)
neg tensor(-0.1435, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8624, grad_fn=<MeanBackward0>)
pos tensor(0.7896, grad_fn=<MeanBackward0>)
neg tensor(0.7071, grad_fn=<MeanBackward0>)
pos tensor(0.7483, grad_fn=<MeanBackward0>)
neg tensor(0.8436, grad_fn=<MeanBackward0>)
pos tensor(0.7176, grad_fn=<MeanBackward0>)
neg tensor(0.8635, grad_fn=<MeanBackward0>)
pos tensor(0.7295, grad_fn=<MeanBackward0>)
neg tensor(0.5373, grad_fn=<MeanBackward0>)
pos tensor(0.8146, grad_fn=<MeanBackward0>)
neg tensor(0.8541, grad_fn=<MeanBackward0>)
pos tensor(0.7302, grad_fn=<MeanBackward0>)
neg tensor(0.8251, grad_fn=<Mea

Training:   1%|▉                                                                                                                                                           | 8/1352 [00:01<05:20,  4.19it/s]

neg tensor(0.1619, grad_fn=<MeanBackward0>)
pos tensor(0.8499, grad_fn=<MeanBackward0>)
neg tensor(0.6714, grad_fn=<MeanBackward0>)
pos tensor(0.7670, grad_fn=<MeanBackward0>)
neg tensor(0.8428, grad_fn=<MeanBackward0>)
pos tensor(0.7491, grad_fn=<MeanBackward0>)
neg tensor(0.8482, grad_fn=<MeanBackward0>)
pos tensor(0.7261, grad_fn=<MeanBackward0>)
neg tensor(0.8795, grad_fn=<MeanBackward0>)
pos tensor(0.7626, grad_fn=<MeanBackward0>)
neg tensor(0.8207, grad_fn=<MeanBackward0>)
pos tensor(0.7587, grad_fn=<MeanBackward0>)
neg tensor(0.8715, grad_fn=<MeanBackward0>)
pos tensor(0.7220, grad_fn=<MeanBackward0>)
neg tensor(0.8505, grad_fn=<MeanBackward0>)
pos tensor(0.7362, grad_fn=<MeanBackward0>)
neg tensor(0.8607, grad_fn=<MeanBackward0>)
pos tensor(0.7439, grad_fn=<MeanBackward0>)
neg tensor(0.8094, grad_fn=<MeanBackward0>)
pos tensor(0.8014, grad_fn=<MeanBackward0>)
neg tensor(0.8633, grad_fn=<MeanBackward0>)
pos tensor(0.8130, grad_fn=<MeanBackward0>)
neg tensor(0.8730, grad_fn=<Mean

Training:   1%|█                                                                                                                                                           | 9/1352 [00:02<05:01,  4.45it/s]

neg tensor(0.8652, grad_fn=<MeanBackward0>)
pos tensor(0.7346, grad_fn=<MeanBackward0>)
neg tensor(0.8547, grad_fn=<MeanBackward0>)
pos tensor(0.8145, grad_fn=<MeanBackward0>)
neg tensor(0.7441, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8598, grad_fn=<MeanBackward0>)
pos tensor(0.7483, grad_fn=<MeanBackward0>)
neg tensor(0.8303, grad_fn=<MeanBackward0>)
pos tensor(0.7719, grad_fn=<MeanBackward0>)
neg tensor(0.8754, grad_fn=<MeanBackward0>)
pos tensor(0.7981, grad_fn=<MeanBackward0>)
neg tensor(0.8409, grad_fn=<MeanBackward0>)
pos tensor(0.7110, grad_fn=<MeanBackward0>)
neg tensor(0.8384, grad_fn=<MeanBackward0>)
pos tensor(0.7710, grad_fn=<MeanBackward0>)
neg tensor(0.7795, grad_fn=<MeanBackward0>)
pos tensor(0.9155, grad_fn=<MeanBackward0>)
neg tensor(0.8282, grad_fn=<MeanBackward0>)
pos tensor(0.7103, grad_fn=<MeanBackward0>)
neg tensor(0.7132, grad_fn=<MeanBackward0>)
pos tensor(0.8173, grad_fn=<MeanBackward0>)
neg tensor(0.8368, grad_fn=<Mean

Training:   1%|█▏                                                                                                                                                         | 10/1352 [00:02<05:03,  4.42it/s]

neg tensor(0.8462, grad_fn=<MeanBackward0>)
pos tensor(0.8300, grad_fn=<MeanBackward0>)
neg tensor(0.8862, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8718, grad_fn=<MeanBackward0>)
pos tensor(0.8002, grad_fn=<MeanBackward0>)
neg tensor(0.8865, grad_fn=<MeanBackward0>)
pos tensor(0.7872, grad_fn=<MeanBackward0>)
neg tensor(0.8245, grad_fn=<MeanBackward0>)
pos tensor(0.7670, grad_fn=<MeanBackward0>)
neg tensor(0.8538, grad_fn=<MeanBackward0>)
pos tensor(0.7960, grad_fn=<MeanBackward0>)
neg tensor(0.8293, grad_fn=<MeanBackward0>)
pos tensor(0.7730, grad_fn=<MeanBackward0>)
neg tensor(0.8627, grad_fn=<MeanBackward0>)
pos tensor(0.7893, grad_fn=<MeanBackward0>)
neg tensor(0.8429, grad_fn=<MeanBackward0>)
pos tensor(0.7236, grad_fn=<MeanBackward0>)
neg tensor(0.3070, grad_fn=<MeanBackward0>)
pos tensor(0.6980, grad_fn=<MeanBackward0>)
neg tensor(0.8756, grad_fn=<MeanBackward0>)
pos tensor(0.7277, grad_fn=<MeanBackward0>)
neg tensor(0.8265, grad_fn=<Mean

Training:   1%|█▎                                                                                                                                                         | 11/1352 [00:02<04:54,  4.55it/s]

neg tensor(0.8235, grad_fn=<MeanBackward0>)
pos tensor(0.7489, grad_fn=<MeanBackward0>)
neg tensor(0.8770, grad_fn=<MeanBackward0>)
pos tensor(0.7759, grad_fn=<MeanBackward0>)
neg tensor(0.7682, grad_fn=<MeanBackward0>)
pos tensor(0.9057, grad_fn=<MeanBackward0>)
neg tensor(0.8787, grad_fn=<MeanBackward0>)
pos tensor(0.8519, grad_fn=<MeanBackward0>)
neg tensor(0.8823, grad_fn=<MeanBackward0>)
pos tensor(0.7842, grad_fn=<MeanBackward0>)
neg tensor(0.8719, grad_fn=<MeanBackward0>)
pos tensor(0.7765, grad_fn=<MeanBackward0>)
neg tensor(0.7875, grad_fn=<MeanBackward0>)
pos tensor(0.8799, grad_fn=<MeanBackward0>)
neg tensor(0.8325, grad_fn=<MeanBackward0>)
pos tensor(0.7359, grad_fn=<MeanBackward0>)
neg tensor(0.8569, grad_fn=<MeanBackward0>)
pos tensor(0.8410, grad_fn=<MeanBackward0>)
neg tensor(0.8593, grad_fn=<MeanBackward0>)
pos tensor(0.8883, grad_fn=<MeanBackward0>)
neg tensor(0.8487, grad_fn=<MeanBackward0>)
pos tensor(0.7328, grad_fn=<MeanBackward0>)
neg tensor(0.8924, grad_fn=<Mean

Training:   1%|█▍                                                                                                                                                         | 12/1352 [00:02<05:03,  4.41it/s]

neg tensor(0.8852, grad_fn=<MeanBackward0>)
pos tensor(0.7453, grad_fn=<MeanBackward0>)
neg tensor(0.8952, grad_fn=<MeanBackward0>)
pos tensor(0.8326, grad_fn=<MeanBackward0>)
neg tensor(0.9069, grad_fn=<MeanBackward0>)
pos tensor(0.8150, grad_fn=<MeanBackward0>)
neg tensor(0.8323, grad_fn=<MeanBackward0>)
pos tensor(0.8768, grad_fn=<MeanBackward0>)
neg tensor(0.8875, grad_fn=<MeanBackward0>)
pos tensor(0.8052, grad_fn=<MeanBackward0>)
neg tensor(0.8199, grad_fn=<MeanBackward0>)
pos tensor(0.7766, grad_fn=<MeanBackward0>)
neg tensor(0.8514, grad_fn=<MeanBackward0>)
pos tensor(0.7873, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(0.6763, grad_fn=<MeanBackward0>)
neg tensor(0.6478, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8754, grad_fn=<MeanBackward0>)
pos tensor(0.7668, grad_fn=<MeanBackward0>)
neg tensor(0.8891, grad_fn=<MeanBackward0>)
pos tensor(0.8529, grad_fn=<MeanBackward0>)
neg tensor(0.8644, grad_fn=<MeanBac

Training:   1%|█▍                                                                                                                                                         | 13/1352 [00:03<05:04,  4.39it/s]

neg tensor(0.8982, grad_fn=<MeanBackward0>)
pos tensor(0.7883, grad_fn=<MeanBackward0>)
neg tensor(0.8982, grad_fn=<MeanBackward0>)
pos tensor(0.7937, grad_fn=<MeanBackward0>)
neg tensor(0.2253, grad_fn=<MeanBackward0>)
pos tensor(0.7718, grad_fn=<MeanBackward0>)
neg tensor(0.8753, grad_fn=<MeanBackward0>)
pos tensor(0.9234, grad_fn=<MeanBackward0>)
neg tensor(0.9032, grad_fn=<MeanBackward0>)
pos tensor(0.7865, grad_fn=<MeanBackward0>)
neg tensor(0.8699, grad_fn=<MeanBackward0>)
pos tensor(0.7712, grad_fn=<MeanBackward0>)
neg tensor(0.7067, grad_fn=<MeanBackward0>)
pos tensor(0.8808, grad_fn=<MeanBackward0>)
neg tensor(0.6948, grad_fn=<MeanBackward0>)
pos tensor(0.7024, grad_fn=<MeanBackward0>)
neg tensor(0.8964, grad_fn=<MeanBackward0>)
pos tensor(0.8574, grad_fn=<MeanBackward0>)
neg tensor(0.8870, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8787, grad_fn=<MeanBackward0>)
pos tensor(0.8364, grad_fn=<MeanBackward0>)
neg tensor(0.8469, grad_fn=<Mean

Training:   1%|█▌                                                                                                                                                         | 14/1352 [00:03<05:17,  4.21it/s]

neg tensor(0.7236, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.8771, grad_fn=<MeanBackward0>)
pos tensor(0.7823, grad_fn=<MeanBackward0>)
neg tensor(0.8719, grad_fn=<MeanBackward0>)
pos tensor(0.7849, grad_fn=<MeanBackward0>)
neg tensor(0.8587, grad_fn=<MeanBackward0>)
pos tensor(0.8604, grad_fn=<MeanBackward0>)
neg tensor(0.7893, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.6511, grad_fn=<MeanBackward0>)
pos tensor(0.6945, grad_fn=<MeanBackward0>)
neg tensor(0.9059, grad_fn=<MeanBackward0>)
pos tensor(0.8035, grad_fn=<MeanBackward0>)
neg tensor(0.8843, grad_fn=<MeanBackward0>)
pos tensor(0.7992, grad_fn=<MeanBackward0>)
neg tensor(0.8687, grad_fn=<MeanBackward0>)
pos tensor(0.8334, grad_fn=<MeanBackward0>)
neg tensor(0.9015, grad_fn=<MeanBackward0>)
pos tensor(0.8200, grad_fn=<MeanBackward0>)
neg tensor(0.7976, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9059, grad_fn=<MeanBackward

Training:   1%|█▋                                                                                                                                                         | 15/1352 [00:03<05:44,  3.88it/s]

neg tensor(0.9042, grad_fn=<MeanBackward0>)
pos tensor(0.7996, grad_fn=<MeanBackward0>)
neg tensor(0.8857, grad_fn=<MeanBackward0>)
pos tensor(0.8533, grad_fn=<MeanBackward0>)
neg tensor(0.5646, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.8678, grad_fn=<MeanBackward0>)
pos tensor(0.7789, grad_fn=<MeanBackward0>)
neg tensor(0.9177, grad_fn=<MeanBackward0>)
pos tensor(0.8152, grad_fn=<MeanBackward0>)
neg tensor(0.7703, grad_fn=<MeanBackward0>)
pos tensor(0.8231, grad_fn=<MeanBackward0>)
neg tensor(0.8891, grad_fn=<MeanBackward0>)
pos tensor(0.7975, grad_fn=<MeanBackward0>)
neg tensor(0.8897, grad_fn=<MeanBackward0>)
pos tensor(0.8015, grad_fn=<MeanBackward0>)
neg tensor(0.8669, grad_fn=<MeanBackward0>)
pos tensor(0.7950, grad_fn=<MeanBackward0>)
neg tensor(0.9024, grad_fn=<MeanBackward0>)
pos tensor(0.8062, grad_fn=<MeanBackward0>)
neg tensor(0.8543, grad_fn=<MeanBackward0>)
pos tensor(0.7785, grad_fn=<MeanBackward0>)
neg tensor(0.9054, grad_fn=<MeanBack

Training:   1%|█▊                                                                                                                                                         | 16/1352 [00:03<06:00,  3.71it/s]

neg tensor(0.9070, grad_fn=<MeanBackward0>)
pos tensor(0.8064, grad_fn=<MeanBackward0>)
neg tensor(0.7811, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9030, grad_fn=<MeanBackward0>)
pos tensor(0.7918, grad_fn=<MeanBackward0>)
neg tensor(0.8930, grad_fn=<MeanBackward0>)
pos tensor(0.7905, grad_fn=<MeanBackward0>)
neg tensor(0.8789, grad_fn=<MeanBackward0>)
pos tensor(0.8604, grad_fn=<MeanBackward0>)
neg tensor(0.9008, grad_fn=<MeanBackward0>)
pos tensor(0.9013, grad_fn=<MeanBackward0>)
neg tensor(0.9199, grad_fn=<MeanBackward0>)
pos tensor(0.8025, grad_fn=<MeanBackward0>)
neg tensor(0.9048, grad_fn=<MeanBackward0>)
pos tensor(0.8212, grad_fn=<MeanBackward0>)
neg tensor(0.8905, grad_fn=<MeanBackward0>)
pos tensor(0.8141, grad_fn=<MeanBackward0>)
neg tensor(0.8969, grad_fn=<MeanBackward0>)
pos tensor(0.8252, grad_fn=<MeanBackward0>)
neg tensor(0.8352, grad_fn=<MeanBackward0>)
pos tensor(0.8211, grad_fn=<MeanBackward0>)
neg tensor(0.8989, grad_fn=<MeanBack

Training:   1%|█▉                                                                                                                                                         | 17/1352 [00:04<05:56,  3.75it/s]

neg tensor(0.8967, grad_fn=<MeanBackward0>)
pos tensor(0.8085, grad_fn=<MeanBackward0>)
neg tensor(0.8855, grad_fn=<MeanBackward0>)
pos tensor(0.8156, grad_fn=<MeanBackward0>)
neg tensor(0.8923, grad_fn=<MeanBackward0>)
pos tensor(0.8273, grad_fn=<MeanBackward0>)
neg tensor(0.8509, grad_fn=<MeanBackward0>)
pos tensor(0.7826, grad_fn=<MeanBackward0>)
neg tensor(0.9151, grad_fn=<MeanBackward0>)
pos tensor(0.8601, grad_fn=<MeanBackward0>)
neg tensor(0.9082, grad_fn=<MeanBackward0>)
pos tensor(0.8123, grad_fn=<MeanBackward0>)
neg tensor(0.8815, grad_fn=<MeanBackward0>)
pos tensor(0.7841, grad_fn=<MeanBackward0>)
neg tensor(0.9106, grad_fn=<MeanBackward0>)
pos tensor(0.8576, grad_fn=<MeanBackward0>)
neg tensor(0.9034, grad_fn=<MeanBackward0>)
pos tensor(0.8036, grad_fn=<MeanBackward0>)
neg tensor(0.9114, grad_fn=<MeanBackward0>)
pos tensor(0.8478, grad_fn=<MeanBackward0>)
neg tensor(0.8388, grad_fn=<MeanBackward0>)
pos tensor(0.8057, grad_fn=<MeanBackward0>)
neg tensor(0.8929, grad_fn=<Mean

Training:   1%|██                                                                                                                                                         | 18/1352 [00:04<05:37,  3.95it/s]

neg tensor(0.9191, grad_fn=<MeanBackward0>)
pos tensor(0.8359, grad_fn=<MeanBackward0>)
neg tensor(0.8925, grad_fn=<MeanBackward0>)
pos tensor(0.8797, grad_fn=<MeanBackward0>)
neg tensor(0.8538, grad_fn=<MeanBackward0>)
pos tensor(0.8800, grad_fn=<MeanBackward0>)
neg tensor(0.8711, grad_fn=<MeanBackward0>)
pos tensor(0.8351, grad_fn=<MeanBackward0>)
neg tensor(0.8967, grad_fn=<MeanBackward0>)
pos tensor(0.8910, grad_fn=<MeanBackward0>)
neg tensor(0.9008, grad_fn=<MeanBackward0>)
pos tensor(0.8058, grad_fn=<MeanBackward0>)
neg tensor(0.9143, grad_fn=<MeanBackward0>)
pos tensor(0.8671, grad_fn=<MeanBackward0>)
neg tensor(0.8921, grad_fn=<MeanBackward0>)
pos tensor(0.8298, grad_fn=<MeanBackward0>)
neg tensor(0.8935, grad_fn=<MeanBackward0>)
pos tensor(0.8125, grad_fn=<MeanBackward0>)
neg tensor(0.8795, grad_fn=<MeanBackward0>)
pos tensor(0.8442, grad_fn=<MeanBackward0>)
neg tensor(0.7913, grad_fn=<MeanBackward0>)
pos tensor(0.8169, grad_fn=<MeanBackward0>)
neg tensor(0.8944, grad_fn=<Mean

Training:   1%|██▏                                                                                                                                                        | 19/1352 [00:04<06:18,  3.52it/s]

neg tensor(0.9246, grad_fn=<MeanBackward0>)
pos tensor(0.8383, grad_fn=<MeanBackward0>)
neg tensor(0.9056, grad_fn=<MeanBackward0>)
pos tensor(0.8539, grad_fn=<MeanBackward0>)
neg tensor(0.9014, grad_fn=<MeanBackward0>)
pos tensor(0.8210, grad_fn=<MeanBackward0>)
neg tensor(0.9119, grad_fn=<MeanBackward0>)
pos tensor(0.8076, grad_fn=<MeanBackward0>)
neg tensor(0.9089, grad_fn=<MeanBackward0>)
pos tensor(0.8560, grad_fn=<MeanBackward0>)
neg tensor(0.9157, grad_fn=<MeanBackward0>)
pos tensor(0.8447, grad_fn=<MeanBackward0>)
neg tensor(0.8830, grad_fn=<MeanBackward0>)
pos tensor(0.8528, grad_fn=<MeanBackward0>)
neg tensor(0.9079, grad_fn=<MeanBackward0>)
pos tensor(0.8143, grad_fn=<MeanBackward0>)
neg tensor(0.9129, grad_fn=<MeanBackward0>)
pos tensor(0.8524, grad_fn=<MeanBackward0>)
neg tensor(0.9088, grad_fn=<MeanBackward0>)
pos tensor(0.8623, grad_fn=<MeanBackward0>)
neg tensor(0.9155, grad_fn=<MeanBackward0>)
pos tensor(0.8326, grad_fn=<MeanBackward0>)
neg tensor(0.8081, grad_fn=<Mean

Training:   1%|██▎                                                                                                                                                        | 20/1352 [00:04<06:12,  3.57it/s]

neg tensor(0.9096, grad_fn=<MeanBackward0>)
pos tensor(0.8319, grad_fn=<MeanBackward0>)
neg tensor(0.9016, grad_fn=<MeanBackward0>)
pos tensor(0.8607, grad_fn=<MeanBackward0>)
neg tensor(0.9217, grad_fn=<MeanBackward0>)
pos tensor(0.8346, grad_fn=<MeanBackward0>)
neg tensor(0.9245, grad_fn=<MeanBackward0>)
pos tensor(0.8365, grad_fn=<MeanBackward0>)
neg tensor(0.9086, grad_fn=<MeanBackward0>)
pos tensor(0.8011, grad_fn=<MeanBackward0>)
neg tensor(0.8782, grad_fn=<MeanBackward0>)
pos tensor(0.7978, grad_fn=<MeanBackward0>)
neg tensor(0.9045, grad_fn=<MeanBackward0>)
pos tensor(0.8522, grad_fn=<MeanBackward0>)
neg tensor(0.8774, grad_fn=<MeanBackward0>)
pos tensor(0.8810, grad_fn=<MeanBackward0>)
neg tensor(0.9203, grad_fn=<MeanBackward0>)
pos tensor(0.8368, grad_fn=<MeanBackward0>)
neg tensor(0.8933, grad_fn=<MeanBackward0>)
pos tensor(0.8304, grad_fn=<MeanBackward0>)
neg tensor(0.9025, grad_fn=<MeanBackward0>)
pos tensor(0.7965, grad_fn=<MeanBackward0>)
neg tensor(0.9261, grad_fn=<Mean

Training:   2%|██▍                                                                                                                                                        | 21/1352 [00:05<05:59,  3.70it/s]

neg tensor(0.8989, grad_fn=<MeanBackward0>)
pos tensor(0.8416, grad_fn=<MeanBackward0>)
neg tensor(0.9053, grad_fn=<MeanBackward0>)
pos tensor(0.9145, grad_fn=<MeanBackward0>)
neg tensor(0.8841, grad_fn=<MeanBackward0>)
pos tensor(0.8282, grad_fn=<MeanBackward0>)
neg tensor(0.9246, grad_fn=<MeanBackward0>)
pos tensor(0.8664, grad_fn=<MeanBackward0>)
neg tensor(0.8538, grad_fn=<MeanBackward0>)
pos tensor(0.8938, grad_fn=<MeanBackward0>)
neg tensor(0.9258, grad_fn=<MeanBackward0>)
pos tensor(0.8351, grad_fn=<MeanBackward0>)
neg tensor(0.9126, grad_fn=<MeanBackward0>)
pos tensor(0.8575, grad_fn=<MeanBackward0>)
neg tensor(0.8987, grad_fn=<MeanBackward0>)
pos tensor(0.8391, grad_fn=<MeanBackward0>)
neg tensor(0.9150, grad_fn=<MeanBackward0>)
pos tensor(0.8283, grad_fn=<MeanBackward0>)
neg tensor(0.9192, grad_fn=<MeanBackward0>)
pos tensor(0.9207, grad_fn=<MeanBackward0>)
neg tensor(0.9073, grad_fn=<MeanBackward0>)
pos tensor(0.8435, grad_fn=<MeanBackward0>)
neg tensor(0.9130, grad_fn=<Mean

Training:   2%|██▌                                                                                                                                                        | 22/1352 [00:05<05:29,  4.03it/s]

neg tensor(0.9345, grad_fn=<MeanBackward0>)
pos tensor(0.8669, grad_fn=<MeanBackward0>)
neg tensor(0.8893, grad_fn=<MeanBackward0>)
pos tensor(0.8845, grad_fn=<MeanBackward0>)
neg tensor(0.9219, grad_fn=<MeanBackward0>)
pos tensor(0.8767, grad_fn=<MeanBackward0>)
neg tensor(0.9143, grad_fn=<MeanBackward0>)
pos tensor(0.9249, grad_fn=<MeanBackward0>)
neg tensor(0.8483, grad_fn=<MeanBackward0>)
pos tensor(0.8347, grad_fn=<MeanBackward0>)
neg tensor(0.7763, grad_fn=<MeanBackward0>)
pos tensor(0.8261, grad_fn=<MeanBackward0>)
neg tensor(0.7368, grad_fn=<MeanBackward0>)
pos tensor(0.7495, grad_fn=<MeanBackward0>)
neg tensor(0.9232, grad_fn=<MeanBackward0>)
pos tensor(0.8353, grad_fn=<MeanBackward0>)
neg tensor(0.8477, grad_fn=<MeanBackward0>)
pos tensor(0.8421, grad_fn=<MeanBackward0>)
neg tensor(0.9223, grad_fn=<MeanBackward0>)
pos tensor(0.8798, grad_fn=<MeanBackward0>)
neg tensor(0.9100, grad_fn=<MeanBackward0>)
pos tensor(0.8724, grad_fn=<MeanBackward0>)
neg tensor(0.9043, grad_fn=<Mean

Training:   2%|██▋                                                                                                                                                        | 23/1352 [00:05<05:35,  3.96it/s]

neg tensor(0.9048, grad_fn=<MeanBackward0>)
pos tensor(0.8352, grad_fn=<MeanBackward0>)
neg tensor(0.9220, grad_fn=<MeanBackward0>)
pos tensor(0.8411, grad_fn=<MeanBackward0>)
neg tensor(0.9155, grad_fn=<MeanBackward0>)
pos tensor(0.8638, grad_fn=<MeanBackward0>)
neg tensor(0.8911, grad_fn=<MeanBackward0>)
pos tensor(0.8845, grad_fn=<MeanBackward0>)
neg tensor(0.9207, grad_fn=<MeanBackward0>)
pos tensor(0.8510, grad_fn=<MeanBackward0>)
neg tensor(0.9195, grad_fn=<MeanBackward0>)
pos tensor(0.8558, grad_fn=<MeanBackward0>)
neg tensor(0.9227, grad_fn=<MeanBackward0>)
pos tensor(0.8603, grad_fn=<MeanBackward0>)
neg tensor(0.9281, grad_fn=<MeanBackward0>)
pos tensor(0.8504, grad_fn=<MeanBackward0>)
neg tensor(0.9156, grad_fn=<MeanBackward0>)
pos tensor(0.8697, grad_fn=<MeanBackward0>)
neg tensor(0.8618, grad_fn=<MeanBackward0>)
pos tensor(0.7626, grad_fn=<MeanBackward0>)
neg tensor(0.9260, grad_fn=<MeanBackward0>)
pos tensor(0.8604, grad_fn=<MeanBackward0>)
neg tensor(0.9134, grad_fn=<Mean

Training:   2%|██▊                                                                                                                                                        | 24/1352 [00:05<05:31,  4.00it/s]

neg tensor(0.9022, grad_fn=<MeanBackward0>)
pos tensor(0.8509, grad_fn=<MeanBackward0>)
neg tensor(0.9211, grad_fn=<MeanBackward0>)
pos tensor(0.8268, grad_fn=<MeanBackward0>)
neg tensor(0.9073, grad_fn=<MeanBackward0>)
pos tensor(0.8750, grad_fn=<MeanBackward0>)
neg tensor(0.9176, grad_fn=<MeanBackward0>)
pos tensor(0.8867, grad_fn=<MeanBackward0>)
neg tensor(0.9141, grad_fn=<MeanBackward0>)
pos tensor(0.8633, grad_fn=<MeanBackward0>)
neg tensor(0.9274, grad_fn=<MeanBackward0>)
pos tensor(0.8558, grad_fn=<MeanBackward0>)
neg tensor(0.9274, grad_fn=<MeanBackward0>)
pos tensor(0.8489, grad_fn=<MeanBackward0>)
neg tensor(0.9041, grad_fn=<MeanBackward0>)
pos tensor(0.8524, grad_fn=<MeanBackward0>)
neg tensor(0.9208, grad_fn=<MeanBackward0>)
pos tensor(0.8555, grad_fn=<MeanBackward0>)
neg tensor(0.9085, grad_fn=<MeanBackward0>)
pos tensor(0.8474, grad_fn=<MeanBackward0>)
neg tensor(0.8472, grad_fn=<MeanBackward0>)
pos tensor(0.8661, grad_fn=<MeanBackward0>)
neg tensor(0.8860, grad_fn=<Mean

Training:   2%|██▊                                                                                                                                                        | 25/1352 [00:06<05:33,  3.97it/s]

neg tensor(0.8846, grad_fn=<MeanBackward0>)
pos tensor(0.8946, grad_fn=<MeanBackward0>)
neg tensor(0.9269, grad_fn=<MeanBackward0>)
pos tensor(0.8513, grad_fn=<MeanBackward0>)
neg tensor(0.9341, grad_fn=<MeanBackward0>)
pos tensor(0.8694, grad_fn=<MeanBackward0>)
neg tensor(0.9265, grad_fn=<MeanBackward0>)
pos tensor(0.8754, grad_fn=<MeanBackward0>)
neg tensor(0.9321, grad_fn=<MeanBackward0>)
pos tensor(0.8652, grad_fn=<MeanBackward0>)
neg tensor(0.9326, grad_fn=<MeanBackward0>)
pos tensor(0.8681, grad_fn=<MeanBackward0>)
neg tensor(0.9259, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8946, grad_fn=<MeanBackward0>)
pos tensor(0.8840, grad_fn=<MeanBackward0>)
neg tensor(0.9139, grad_fn=<MeanBackward0>)
pos tensor(0.8598, grad_fn=<MeanBackward0>)
neg tensor(0.8874, grad_fn=<MeanBackward0>)
pos tensor(0.8235, grad_fn=<MeanBackward0>)
neg tensor(0.9134, grad_fn=<MeanBackward0>)
pos tensor(0.8548, grad_fn=<MeanBackward0>)
neg tensor(0.9253, grad_fn=<Mean

Training:   2%|██▉                                                                                                                                                        | 26/1352 [00:06<05:29,  4.03it/s]

neg tensor(0.9129, grad_fn=<MeanBackward0>)
pos tensor(0.8492, grad_fn=<MeanBackward0>)
neg tensor(0.9172, grad_fn=<MeanBackward0>)
pos tensor(0.8654, grad_fn=<MeanBackward0>)
neg tensor(0.9333, grad_fn=<MeanBackward0>)
pos tensor(0.9495, grad_fn=<MeanBackward0>)
neg tensor(0.9242, grad_fn=<MeanBackward0>)
pos tensor(0.8950, grad_fn=<MeanBackward0>)
neg tensor(0.9178, grad_fn=<MeanBackward0>)
pos tensor(0.8411, grad_fn=<MeanBackward0>)
neg tensor(0.9323, grad_fn=<MeanBackward0>)
pos tensor(0.8694, grad_fn=<MeanBackward0>)
neg tensor(0.9229, grad_fn=<MeanBackward0>)
pos tensor(0.8788, grad_fn=<MeanBackward0>)
neg tensor(0.9348, grad_fn=<MeanBackward0>)
pos tensor(0.8702, grad_fn=<MeanBackward0>)
neg tensor(0.9201, grad_fn=<MeanBackward0>)
pos tensor(0.9045, grad_fn=<MeanBackward0>)
neg tensor(-0.0712, grad_fn=<MeanBackward0>)
pos tensor(0.8450, grad_fn=<MeanBackward0>)
neg tensor(0.9215, grad_fn=<MeanBackward0>)
pos tensor(0.8568, grad_fn=<MeanBackward0>)
neg tensor(0.9155, grad_fn=<Mea

Training:   2%|███                                                                                                                                                        | 27/1352 [00:06<05:37,  3.92it/s]

neg tensor(0.9289, grad_fn=<MeanBackward0>)
pos tensor(0.8567, grad_fn=<MeanBackward0>)
neg tensor(0.8919, grad_fn=<MeanBackward0>)
pos tensor(0.8322, grad_fn=<MeanBackward0>)
neg tensor(0.9393, grad_fn=<MeanBackward0>)
pos tensor(0.8856, grad_fn=<MeanBackward0>)
neg tensor(0.9371, grad_fn=<MeanBackward0>)
pos tensor(0.8712, grad_fn=<MeanBackward0>)
neg tensor(0.8895, grad_fn=<MeanBackward0>)
pos tensor(0.9175, grad_fn=<MeanBackward0>)
neg tensor(0.9380, grad_fn=<MeanBackward0>)
pos tensor(0.8621, grad_fn=<MeanBackward0>)
neg tensor(0.9285, grad_fn=<MeanBackward0>)
pos tensor(0.8692, grad_fn=<MeanBackward0>)
neg tensor(0.9345, grad_fn=<MeanBackward0>)
pos tensor(0.8638, grad_fn=<MeanBackward0>)
neg tensor(0.9131, grad_fn=<MeanBackward0>)
pos tensor(0.8372, grad_fn=<MeanBackward0>)
neg tensor(0.9234, grad_fn=<MeanBackward0>)
pos tensor(0.9182, grad_fn=<MeanBackward0>)
neg tensor(0.9327, grad_fn=<MeanBackward0>)
pos tensor(0.8870, grad_fn=<MeanBackward0>)
neg tensor(0.9149, grad_fn=<Mean

Training:   2%|███▏                                                                                                                                                       | 28/1352 [00:06<05:33,  3.97it/s]

neg tensor(0.9354, grad_fn=<MeanBackward0>)
pos tensor(0.8681, grad_fn=<MeanBackward0>)
neg tensor(0.9087, grad_fn=<MeanBackward0>)
pos tensor(0.8562, grad_fn=<MeanBackward0>)
neg tensor(0.9335, grad_fn=<MeanBackward0>)
pos tensor(0.8823, grad_fn=<MeanBackward0>)
neg tensor(0.9270, grad_fn=<MeanBackward0>)
pos tensor(0.8673, grad_fn=<MeanBackward0>)
neg tensor(0.8403, grad_fn=<MeanBackward0>)
pos tensor(0.8531, grad_fn=<MeanBackward0>)
neg tensor(0.4810, grad_fn=<MeanBackward0>)
pos tensor(0.8049, grad_fn=<MeanBackward0>)
neg tensor(0.9304, grad_fn=<MeanBackward0>)
pos tensor(0.8689, grad_fn=<MeanBackward0>)
neg tensor(0.9299, grad_fn=<MeanBackward0>)
pos tensor(0.8802, grad_fn=<MeanBackward0>)
neg tensor(0.9245, grad_fn=<MeanBackward0>)
pos tensor(0.8790, grad_fn=<MeanBackward0>)
neg tensor(-0.0359, grad_fn=<MeanBackward0>)
pos tensor(0.7985, grad_fn=<MeanBackward0>)
neg tensor(0.9352, grad_fn=<MeanBackward0>)
pos tensor(0.9095, grad_fn=<MeanBackward0>)
neg tensor(0.9195, grad_fn=<Mea

Training:   2%|███▎                                                                                                                                                       | 29/1352 [00:07<05:21,  4.12it/s]

neg tensor(0.8881, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.8603, grad_fn=<MeanBackward0>)
pos tensor(0.9270, grad_fn=<MeanBackward0>)
neg tensor(0.9263, grad_fn=<MeanBackward0>)
pos tensor(0.9060, grad_fn=<MeanBackward0>)
neg tensor(0.9247, grad_fn=<MeanBackward0>)
pos tensor(0.8651, grad_fn=<MeanBackward0>)
neg tensor(0.9317, grad_fn=<MeanBackward0>)
pos tensor(0.8898, grad_fn=<MeanBackward0>)
neg tensor(0.9258, grad_fn=<MeanBackward0>)
pos tensor(0.8664, grad_fn=<MeanBackward0>)
neg tensor(0.9349, grad_fn=<MeanBackward0>)
pos tensor(0.9107, grad_fn=<MeanBackward0>)
neg tensor(0.9326, grad_fn=<MeanBackward0>)
pos tensor(0.8679, grad_fn=<MeanBackward0>)
neg tensor(0.9293, grad_fn=<MeanBackward0>)
pos tensor(0.8717, grad_fn=<MeanBackward0>)
neg tensor(0.9395, grad_fn=<MeanBackward0>)
pos tensor(0.8993, grad_fn=<MeanBackward0>)
neg tensor(0.9299, grad_fn=<MeanBackward0>)
pos tensor(0.8905, grad_fn=<MeanBackward0>)
neg tensor(0.9309, grad_fn=<MeanBack

Training:   2%|███▍                                                                                                                                                       | 30/1352 [00:07<05:08,  4.29it/s]

neg tensor(0.9367, grad_fn=<MeanBackward0>)
pos tensor(0.8799, grad_fn=<MeanBackward0>)
neg tensor(0.9318, grad_fn=<MeanBackward0>)
pos tensor(0.8782, grad_fn=<MeanBackward0>)
neg tensor(0.9241, grad_fn=<MeanBackward0>)
pos tensor(0.9093, grad_fn=<MeanBackward0>)
neg tensor(0.8783, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8896, grad_fn=<MeanBackward0>)
pos tensor(0.8682, grad_fn=<MeanBackward0>)
neg tensor(0.9354, grad_fn=<MeanBackward0>)
pos tensor(0.8667, grad_fn=<MeanBackward0>)
neg tensor(0.2544, grad_fn=<MeanBackward0>)
pos tensor(0.8796, grad_fn=<MeanBackward0>)
neg tensor(0.8873, grad_fn=<MeanBackward0>)
pos tensor(0.9629, grad_fn=<MeanBackward0>)
neg tensor(0.9404, grad_fn=<MeanBackward0>)
pos tensor(0.9023, grad_fn=<MeanBackward0>)
neg tensor(0.9343, grad_fn=<MeanBackward0>)
pos tensor(0.8782, grad_fn=<MeanBackward0>)
neg tensor(0.9172, grad_fn=<MeanBackward0>)
pos tensor(0.8815, grad_fn=<MeanBackward0>)
neg tensor(0.9194, grad_fn=<Mean

Training:   2%|███▌                                                                                                                                                       | 31/1352 [00:07<05:34,  3.95it/s]

neg tensor(0.9061, grad_fn=<MeanBackward0>)
pos tensor(0.8835, grad_fn=<MeanBackward0>)
neg tensor(0.9233, grad_fn=<MeanBackward0>)
pos tensor(0.8740, grad_fn=<MeanBackward0>)
neg tensor(0.9262, grad_fn=<MeanBackward0>)
pos tensor(0.8811, grad_fn=<MeanBackward0>)
neg tensor(0.9443, grad_fn=<MeanBackward0>)
pos tensor(0.8859, grad_fn=<MeanBackward0>)
neg tensor(0.9317, grad_fn=<MeanBackward0>)
pos tensor(0.8948, grad_fn=<MeanBackward0>)
neg tensor(0.9479, grad_fn=<MeanBackward0>)
pos tensor(0.8917, grad_fn=<MeanBackward0>)
neg tensor(0.9488, grad_fn=<MeanBackward0>)
pos tensor(0.8905, grad_fn=<MeanBackward0>)
neg tensor(0.9277, grad_fn=<MeanBackward0>)
pos tensor(0.9230, grad_fn=<MeanBackward0>)
neg tensor(0.9434, grad_fn=<MeanBackward0>)
pos tensor(0.8920, grad_fn=<MeanBackward0>)
neg tensor(0.9378, grad_fn=<MeanBackward0>)
pos tensor(0.8836, grad_fn=<MeanBackward0>)
neg tensor(0.9359, grad_fn=<MeanBackward0>)
pos tensor(0.9076, grad_fn=<MeanBackward0>)
neg tensor(0.9315, grad_fn=<Mean

Training:   2%|███▋                                                                                                                                                       | 32/1352 [00:07<05:32,  3.97it/s]

neg tensor(0.9304, grad_fn=<MeanBackward0>)
pos tensor(0.8880, grad_fn=<MeanBackward0>)
neg tensor(0.9485, grad_fn=<MeanBackward0>)
pos tensor(0.8818, grad_fn=<MeanBackward0>)
neg tensor(0.9197, grad_fn=<MeanBackward0>)
pos tensor(0.9159, grad_fn=<MeanBackward0>)
neg tensor(0.9098, grad_fn=<MeanBackward0>)
pos tensor(0.8767, grad_fn=<MeanBackward0>)
neg tensor(0.9388, grad_fn=<MeanBackward0>)
pos tensor(0.9287, grad_fn=<MeanBackward0>)
neg tensor(0.9244, grad_fn=<MeanBackward0>)
pos tensor(0.8851, grad_fn=<MeanBackward0>)
neg tensor(0.9424, grad_fn=<MeanBackward0>)
pos tensor(0.8968, grad_fn=<MeanBackward0>)
neg tensor(0.9130, grad_fn=<MeanBackward0>)
pos tensor(0.9080, grad_fn=<MeanBackward0>)
neg tensor(0.9348, grad_fn=<MeanBackward0>)
pos tensor(0.9031, grad_fn=<MeanBackward0>)
neg tensor(0.9309, grad_fn=<MeanBackward0>)
pos tensor(0.9084, grad_fn=<MeanBackward0>)
neg tensor(0.9212, grad_fn=<MeanBackward0>)
pos tensor(0.8833, grad_fn=<MeanBackward0>)
neg tensor(0.9414, grad_fn=<Mean

Training:   2%|███▊                                                                                                                                                       | 33/1352 [00:08<05:32,  3.97it/s]

neg tensor(0.9115, grad_fn=<MeanBackward0>)
pos tensor(0.9059, grad_fn=<MeanBackward0>)
neg tensor(0.9436, grad_fn=<MeanBackward0>)
pos tensor(0.8719, grad_fn=<MeanBackward0>)
neg tensor(0.9465, grad_fn=<MeanBackward0>)
pos tensor(0.9048, grad_fn=<MeanBackward0>)
neg tensor(0.9394, grad_fn=<MeanBackward0>)
pos tensor(0.8986, grad_fn=<MeanBackward0>)
neg tensor(0.9123, grad_fn=<MeanBackward0>)
pos tensor(0.8395, grad_fn=<MeanBackward0>)
neg tensor(0.9223, grad_fn=<MeanBackward0>)
pos tensor(0.8948, grad_fn=<MeanBackward0>)
neg tensor(0.9448, grad_fn=<MeanBackward0>)
pos tensor(0.8857, grad_fn=<MeanBackward0>)
neg tensor(0.9302, grad_fn=<MeanBackward0>)
pos tensor(0.8828, grad_fn=<MeanBackward0>)
neg tensor(0.9545, grad_fn=<MeanBackward0>)
pos tensor(0.9160, grad_fn=<MeanBackward0>)
neg tensor(0.9166, grad_fn=<MeanBackward0>)
pos tensor(0.9083, grad_fn=<MeanBackward0>)
neg tensor(0.9070, grad_fn=<MeanBackward0>)
pos tensor(0.8697, grad_fn=<MeanBackward0>)
neg tensor(0.9419, grad_fn=<Mean

Training:   3%|███▉                                                                                                                                                       | 34/1352 [00:08<05:52,  3.74it/s]

neg tensor(0.9502, grad_fn=<MeanBackward0>)
pos tensor(0.9160, grad_fn=<MeanBackward0>)
neg tensor(0.9320, grad_fn=<MeanBackward0>)
pos tensor(0.8903, grad_fn=<MeanBackward0>)
neg tensor(0.8966, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.9009, grad_fn=<MeanBackward0>)
pos tensor(0.9064, grad_fn=<MeanBackward0>)
neg tensor(0.9390, grad_fn=<MeanBackward0>)
pos tensor(0.9064, grad_fn=<MeanBackward0>)
neg tensor(0.9506, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9436, grad_fn=<MeanBackward0>)
pos tensor(0.8847, grad_fn=<MeanBackward0>)
neg tensor(0.9518, grad_fn=<MeanBackward0>)
pos tensor(0.9067, grad_fn=<MeanBackward0>)
neg tensor(0.9473, grad_fn=<MeanBackward0>)
pos tensor(0.8865, grad_fn=<MeanBackward0>)
neg tensor(0.9514, grad_fn=<MeanBackward0>)
pos tensor(0.8991, grad_fn=<MeanBackward0>)
neg tensor(0.9398, grad_fn=<MeanBackward0>)
pos tensor(0.8830, grad_fn=<MeanBackward0>)
neg tensor(0.9465, grad_fn=<Mean

Training:   3%|████                                                                                                                                                       | 35/1352 [00:08<06:15,  3.51it/s]

neg tensor(0.9437, grad_fn=<MeanBackward0>)
pos tensor(0.8852, grad_fn=<MeanBackward0>)
neg tensor(0.9445, grad_fn=<MeanBackward0>)
pos tensor(0.9107, grad_fn=<MeanBackward0>)
neg tensor(0.9488, grad_fn=<MeanBackward0>)
pos tensor(0.9112, grad_fn=<MeanBackward0>)
neg tensor(0.9305, grad_fn=<MeanBackward0>)
pos tensor(0.9197, grad_fn=<MeanBackward0>)
neg tensor(0.9449, grad_fn=<MeanBackward0>)
pos tensor(0.9024, grad_fn=<MeanBackward0>)
neg tensor(0.8774, grad_fn=<MeanBackward0>)
pos tensor(0.8855, grad_fn=<MeanBackward0>)
neg tensor(0.9421, grad_fn=<MeanBackward0>)
pos tensor(0.9017, grad_fn=<MeanBackward0>)
neg tensor(0.9428, grad_fn=<MeanBackward0>)
pos tensor(0.9044, grad_fn=<MeanBackward0>)
neg tensor(0.9453, grad_fn=<MeanBackward0>)
pos tensor(0.8901, grad_fn=<MeanBackward0>)
neg tensor(0.9377, grad_fn=<MeanBackward0>)
pos tensor(0.8896, grad_fn=<MeanBackward0>)
neg tensor(0.9483, grad_fn=<MeanBackward0>)
pos tensor(0.8978, grad_fn=<MeanBackward0>)
neg tensor(0.9389, grad_fn=<Mean

Training:   3%|████▏                                                                                                                                                      | 36/1352 [00:09<05:42,  3.84it/s]

neg tensor(0.9184, grad_fn=<MeanBackward0>)
pos tensor(0.8915, grad_fn=<MeanBackward0>)
neg tensor(0.9129, grad_fn=<MeanBackward0>)
pos tensor(0.9004, grad_fn=<MeanBackward0>)
neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(0.9345, grad_fn=<MeanBackward0>)
neg tensor(0.9226, grad_fn=<MeanBackward0>)
pos tensor(0.9008, grad_fn=<MeanBackward0>)
neg tensor(0.9474, grad_fn=<MeanBackward0>)
pos tensor(0.8961, grad_fn=<MeanBackward0>)
neg tensor(0.9298, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9142, grad_fn=<MeanBackward0>)
pos tensor(0.8969, grad_fn=<MeanBackward0>)
neg tensor(0.9464, grad_fn=<MeanBackward0>)
pos tensor(0.8914, grad_fn=<MeanBackward0>)
neg tensor(0.9408, grad_fn=<MeanBackward0>)
pos tensor(0.9033, grad_fn=<MeanBackward0>)
neg tensor(0.9556, grad_fn=<MeanBackward0>)
pos tensor(0.9347, grad_fn=<MeanBackward0>)
neg tensor(0.9216, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9321, grad_fn=<Mean

Training:   3%|████▏                                                                                                                                                      | 37/1352 [00:09<05:17,  4.14it/s]

neg tensor(0.9079, grad_fn=<MeanBackward0>)
pos tensor(0.8771, grad_fn=<MeanBackward0>)
neg tensor(0.9485, grad_fn=<MeanBackward0>)
pos tensor(0.8961, grad_fn=<MeanBackward0>)
neg tensor(0.9374, grad_fn=<MeanBackward0>)
pos tensor(0.9066, grad_fn=<MeanBackward0>)
neg tensor(0.9114, grad_fn=<MeanBackward0>)
pos tensor(0.9239, grad_fn=<MeanBackward0>)
neg tensor(0.8932, grad_fn=<MeanBackward0>)
pos tensor(0.9429, grad_fn=<MeanBackward0>)
neg tensor(0.9428, grad_fn=<MeanBackward0>)
pos tensor(0.9487, grad_fn=<MeanBackward0>)
neg tensor(0.9130, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9286, grad_fn=<MeanBackward0>)
pos tensor(0.9045, grad_fn=<MeanBackward0>)
neg tensor(0.9396, grad_fn=<MeanBackward0>)
pos tensor(0.9008, grad_fn=<MeanBackward0>)
neg tensor(0.9338, grad_fn=<MeanBackward0>)
pos tensor(0.8818, grad_fn=<MeanBackward0>)
neg tensor(0.9384, grad_fn=<MeanBackward0>)
pos tensor(0.8908, grad_fn=<MeanBackward0>)


Training:   3%|████▎                                                                                                                                                      | 38/1352 [00:09<05:38,  3.88it/s]

neg tensor(0.9416, grad_fn=<MeanBackward0>)
pos tensor(0.8924, grad_fn=<MeanBackward0>)
neg tensor(0.9439, grad_fn=<MeanBackward0>)
pos tensor(0.9067, grad_fn=<MeanBackward0>)
neg tensor(0.9505, grad_fn=<MeanBackward0>)
pos tensor(0.8931, grad_fn=<MeanBackward0>)
neg tensor(0.9345, grad_fn=<MeanBackward0>)
pos tensor(0.8920, grad_fn=<MeanBackward0>)
neg tensor(0.9515, grad_fn=<MeanBackward0>)
pos tensor(0.9001, grad_fn=<MeanBackward0>)
neg tensor(0.9502, grad_fn=<MeanBackward0>)
pos tensor(0.8886, grad_fn=<MeanBackward0>)
neg tensor(0.9506, grad_fn=<MeanBackward0>)
pos tensor(0.9086, grad_fn=<MeanBackward0>)
neg tensor(0.9071, grad_fn=<MeanBackward0>)
pos tensor(0.9277, grad_fn=<MeanBackward0>)
neg tensor(0.9491, grad_fn=<MeanBackward0>)
pos tensor(0.9313, grad_fn=<MeanBackward0>)
neg tensor(0.9517, grad_fn=<MeanBackward0>)
pos tensor(0.8955, grad_fn=<MeanBackward0>)
neg tensor(0.9403, grad_fn=<MeanBackward0>)
pos tensor(0.9303, grad_fn=<MeanBackward0>)
neg tensor(0.9060, grad_fn=<Mean

Training:   3%|████▍                                                                                                                                                      | 39/1352 [00:09<05:28,  4.00it/s]

neg tensor(0.8905, grad_fn=<MeanBackward0>)
pos tensor(0.8561, grad_fn=<MeanBackward0>)
neg tensor(0.9439, grad_fn=<MeanBackward0>)
pos tensor(0.9135, grad_fn=<MeanBackward0>)
neg tensor(0.9208, grad_fn=<MeanBackward0>)
pos tensor(0.9284, grad_fn=<MeanBackward0>)
neg tensor(0.9498, grad_fn=<MeanBackward0>)
pos tensor(0.8959, grad_fn=<MeanBackward0>)
neg tensor(0.9391, grad_fn=<MeanBackward0>)
pos tensor(0.8945, grad_fn=<MeanBackward0>)
neg tensor(0.9491, grad_fn=<MeanBackward0>)
pos tensor(0.8949, grad_fn=<MeanBackward0>)
neg tensor(-0.2228, grad_fn=<MeanBackward0>)
pos tensor(0.8612, grad_fn=<MeanBackward0>)
neg tensor(0.9267, grad_fn=<MeanBackward0>)
pos tensor(0.9100, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9133, grad_fn=<MeanBackward0>)
neg tensor(0.9323, grad_fn=<MeanBackward0>)
pos tensor(0.9447, grad_fn=<MeanBackward0>)
neg tensor(0.9392, grad_fn=<MeanBackward0>)
pos tensor(0.9100, grad_fn=<MeanBackward0>)
neg tensor(0.9418, grad_fn=<Mea

Training:   3%|████▌                                                                                                                                                      | 40/1352 [00:09<05:10,  4.23it/s]

neg tensor(0.9488, grad_fn=<MeanBackward0>)
pos tensor(0.9212, grad_fn=<MeanBackward0>)
neg tensor(0.7410, grad_fn=<MeanBackward0>)
pos tensor(0.8729, grad_fn=<MeanBackward0>)
neg tensor(0.9510, grad_fn=<MeanBackward0>)
pos tensor(0.9136, grad_fn=<MeanBackward0>)
neg tensor(0.9143, grad_fn=<MeanBackward0>)
pos tensor(0.9072, grad_fn=<MeanBackward0>)
neg tensor(0.9143, grad_fn=<MeanBackward0>)
pos tensor(0.9214, grad_fn=<MeanBackward0>)
neg tensor(0.9343, grad_fn=<MeanBackward0>)
pos tensor(0.9138, grad_fn=<MeanBackward0>)
neg tensor(0.9535, grad_fn=<MeanBackward0>)
pos tensor(0.9070, grad_fn=<MeanBackward0>)
neg tensor(0.9305, grad_fn=<MeanBackward0>)
pos tensor(0.9397, grad_fn=<MeanBackward0>)
neg tensor(0.9314, grad_fn=<MeanBackward0>)
pos tensor(0.8761, grad_fn=<MeanBackward0>)
neg tensor(0.9421, grad_fn=<MeanBackward0>)
pos tensor(0.9293, grad_fn=<MeanBackward0>)
neg tensor(0.9384, grad_fn=<MeanBackward0>)
pos tensor(0.9082, grad_fn=<MeanBackward0>)
neg tensor(0.9412, grad_fn=<Mean

Training:   3%|████▋                                                                                                                                                      | 41/1352 [00:10<04:43,  4.63it/s]

tensor(0.9281, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9438, grad_fn=<MeanBackward0>)
pos tensor(0.9351, grad_fn=<MeanBackward0>)
neg tensor(0.8978, grad_fn=<MeanBackward0>)
pos tensor(0.8728, grad_fn=<MeanBackward0>)
neg tensor(0.9301, grad_fn=<MeanBackward0>)
pos tensor(0.9044, grad_fn=<MeanBackward0>)
neg tensor(0.9362, grad_fn=<MeanBackward0>)
pos tensor(0.9447, grad_fn=<MeanBackward0>)


Training:   3%|████▊                                                                                                                                                      | 42/1352 [00:10<05:00,  4.36it/s]

neg tensor(0.9171, grad_fn=<MeanBackward0>)
pos tensor(0.9064, grad_fn=<MeanBackward0>)
neg tensor(0.9234, grad_fn=<MeanBackward0>)
pos tensor(0.9033, grad_fn=<MeanBackward0>)
neg tensor(0.9470, grad_fn=<MeanBackward0>)
pos tensor(0.9413, grad_fn=<MeanBackward0>)
neg tensor(0.9429, grad_fn=<MeanBackward0>)
pos tensor(0.9324, grad_fn=<MeanBackward0>)
neg tensor(0.9555, grad_fn=<MeanBackward0>)
pos tensor(0.9168, grad_fn=<MeanBackward0>)
neg tensor(0.9534, grad_fn=<MeanBackward0>)
pos tensor(0.9279, grad_fn=<MeanBackward0>)
neg tensor(0.9428, grad_fn=<MeanBackward0>)
pos tensor(0.9182, grad_fn=<MeanBackward0>)
neg tensor(0.9499, grad_fn=<MeanBackward0>)
pos tensor(0.9094, grad_fn=<MeanBackward0>)
neg tensor(0.9493, grad_fn=<MeanBackward0>)
pos tensor(0.9046, grad_fn=<MeanBackward0>)
neg tensor(0.9540, grad_fn=<MeanBackward0>)
pos tensor(0.9013, grad_fn=<MeanBackward0>)
neg tensor(0.9382, grad_fn=<MeanBackward0>)
pos tensor(0.8953, grad_fn=<MeanBackward0>)
neg tensor(0.9452, grad_fn=<Mean

Training:   3%|████▉                                                                                                                                                      | 43/1352 [00:10<04:59,  4.36it/s]

neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9486, grad_fn=<MeanBackward0>)
neg tensor(0.9364, grad_fn=<MeanBackward0>)
pos tensor(0.9452, grad_fn=<MeanBackward0>)
neg tensor(0.9386, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.8865, grad_fn=<MeanBackward0>)
pos tensor(0.9151, grad_fn=<MeanBackward0>)
neg tensor(0.9489, grad_fn=<MeanBackward0>)
pos tensor(0.9103, grad_fn=<MeanBackward0>)
neg tensor(0.9485, grad_fn=<MeanBackward0>)
pos tensor(0.9050, grad_fn=<MeanBackward0>)
neg tensor(0.9373, grad_fn=<MeanBackward0>)
pos tensor(0.8835, grad_fn=<MeanBackward0>)
neg tensor(0.9403, grad_fn=<MeanBackward0>)
pos tensor(0.9070, grad_fn=<MeanBackward0>)
neg tensor(0.9501, grad_fn=<MeanBackward0>)
pos tensor(0.9201, grad_fn=<MeanBackward0>)
neg tensor(0.9543, grad_fn=<MeanBackward0>)
pos tensor(0.9278, grad_fn=<MeanBackward0>)
neg tensor(0.9508, grad_fn=<MeanBackward0>)
pos tensor(0.9383, grad_fn=<MeanBackward0>)
neg tensor(0.9507, grad_fn=<Mean

Training:   3%|█████                                                                                                                                                      | 44/1352 [00:10<05:22,  4.05it/s]

neg tensor(0.9558, grad_fn=<MeanBackward0>)
pos tensor(0.9110, grad_fn=<MeanBackward0>)
neg tensor(0.9492, grad_fn=<MeanBackward0>)
pos tensor(0.9538, grad_fn=<MeanBackward0>)
neg tensor(0.9505, grad_fn=<MeanBackward0>)
pos tensor(0.9147, grad_fn=<MeanBackward0>)
neg tensor(0.9538, grad_fn=<MeanBackward0>)
pos tensor(0.9084, grad_fn=<MeanBackward0>)
neg tensor(0.9496, grad_fn=<MeanBackward0>)
pos tensor(0.9442, grad_fn=<MeanBackward0>)
neg tensor(0.9539, grad_fn=<MeanBackward0>)
pos tensor(0.9259, grad_fn=<MeanBackward0>)
neg tensor(0.9426, grad_fn=<MeanBackward0>)
pos tensor(0.9209, grad_fn=<MeanBackward0>)
neg tensor(0.9635, grad_fn=<MeanBackward0>)
pos tensor(0.9365, grad_fn=<MeanBackward0>)
neg tensor(0.9454, grad_fn=<MeanBackward0>)
pos tensor(0.9033, grad_fn=<MeanBackward0>)
neg tensor(0.9521, grad_fn=<MeanBackward0>)
pos tensor(0.9186, grad_fn=<MeanBackward0>)
neg tensor(0.9524, grad_fn=<MeanBackward0>)
pos tensor(0.9201, grad_fn=<MeanBackward0>)
neg tensor(0.9473, grad_fn=<Mean

Training:   3%|█████▏                                                                                                                                                     | 45/1352 [00:11<05:02,  4.32it/s]

neg tensor(0.8679, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9483, grad_fn=<MeanBackward0>)
pos tensor(0.9000, grad_fn=<MeanBackward0>)
neg tensor(0.9355, grad_fn=<MeanBackward0>)
pos tensor(0.9205, grad_fn=<MeanBackward0>)
neg tensor(0.9442, grad_fn=<MeanBackward0>)
pos tensor(0.9249, grad_fn=<MeanBackward0>)
neg tensor(0.9551, grad_fn=<MeanBackward0>)
pos tensor(0.9210, grad_fn=<MeanBackward0>)
neg tensor(0.9338, grad_fn=<MeanBackward0>)
pos tensor(0.9115, grad_fn=<MeanBackward0>)
neg tensor(0.9531, grad_fn=<MeanBackward0>)
pos tensor(0.9323, grad_fn=<MeanBackward0>)
neg tensor(0.9482, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.9397, grad_fn=<MeanBackward0>)
pos tensor(0.9461, grad_fn=<MeanBackward0>)
neg tensor(0.8923, grad_fn=<MeanBackward0>)
pos tensor(0.9035, grad_fn=<MeanBackward0>)
neg tensor(0.9050, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.9284, grad_fn=<MeanBack

Training:   3%|█████▎                                                                                                                                                     | 46/1352 [00:11<04:54,  4.43it/s]

neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(0.9271, grad_fn=<MeanBackward0>)
neg tensor(0.9239, grad_fn=<MeanBackward0>)
pos tensor(0.9471, grad_fn=<MeanBackward0>)
neg tensor(0.9106, grad_fn=<MeanBackward0>)
pos tensor(0.9013, grad_fn=<MeanBackward0>)
neg tensor(0.9374, grad_fn=<MeanBackward0>)
pos tensor(0.9237, grad_fn=<MeanBackward0>)
neg tensor(0.9458, grad_fn=<MeanBackward0>)
pos tensor(0.9111, grad_fn=<MeanBackward0>)
neg tensor(0.9443, grad_fn=<MeanBackward0>)
pos tensor(0.9126, grad_fn=<MeanBackward0>)
neg tensor(0.9296, grad_fn=<MeanBackward0>)
pos tensor(0.9228, grad_fn=<MeanBackward0>)
neg tensor(0.9524, grad_fn=<MeanBackward0>)
pos tensor(0.9081, grad_fn=<MeanBackward0>)
neg tensor(0.9261, grad_fn=<MeanBackward0>)
pos tensor(0.9012, grad_fn=<MeanBackward0>)
neg tensor(0.9312, grad_fn=<MeanBackward0>)
pos tensor(0.8966, grad_fn=<MeanBackward0>)
neg tensor(0.9299, grad_fn=<MeanBackward0>)
pos tensor(0.8862, grad_fn=<MeanBackward0>)
neg tensor(0.9591, grad_fn=<Mean

Training:   3%|█████▍                                                                                                                                                     | 47/1352 [00:11<04:33,  4.77it/s]

tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9280, grad_fn=<MeanBackward0>)
neg tensor(0.9226, grad_fn=<MeanBackward0>)
pos tensor(0.9079, grad_fn=<MeanBackward0>)
neg tensor(0.9434, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9411, grad_fn=<MeanBackward0>)
pos tensor(0.9234, grad_fn=<MeanBackward0>)
neg tensor(0.9508, grad_fn=<MeanBackward0>)
pos tensor(0.9138, grad_fn=<MeanBackward0>)
neg tensor(0.9527, grad_fn=<MeanBackward0>)
pos tensor(0.9187, grad_fn=<MeanBackward0>)
neg tensor(0.9239, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9596, grad_fn=<MeanBackward0>)
pos tensor(0.9290, grad_fn=<MeanBackward0>)
neg tensor(0.9562, grad_fn=<MeanBackward0>)
pos tensor(0.9302, grad_fn=<MeanBackward0>)
neg 

Training:   4%|█████▌                                                                                                                                                     | 48/1352 [00:11<04:40,  4.65it/s]

tensor(0.9487, grad_fn=<MeanBackward0>)
pos tensor(0.9114, grad_fn=<MeanBackward0>)
neg tensor(0.9603, grad_fn=<MeanBackward0>)
pos tensor(0.9400, grad_fn=<MeanBackward0>)
neg tensor(0.9543, grad_fn=<MeanBackward0>)
pos tensor(0.9264, grad_fn=<MeanBackward0>)
neg tensor(0.9525, grad_fn=<MeanBackward0>)
pos tensor(0.9434, grad_fn=<MeanBackward0>)
neg tensor(0.9583, grad_fn=<MeanBackward0>)
pos tensor(0.9224, grad_fn=<MeanBackward0>)
neg tensor(0.9532, grad_fn=<MeanBackward0>)
pos tensor(0.9148, grad_fn=<MeanBackward0>)
neg tensor(0.9439, grad_fn=<MeanBackward0>)
pos tensor(0.9374, grad_fn=<MeanBackward0>)
neg tensor(0.9514, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.8199, grad_fn=<MeanBackward0>)
pos tensor(0.9199, grad_fn=<MeanBackward0>)


Training:   4%|█████▌                                                                                                                                                     | 49/1352 [00:11<04:59,  4.35it/s]

neg tensor(0.9490, grad_fn=<MeanBackward0>)
pos tensor(0.9335, grad_fn=<MeanBackward0>)
neg tensor(0.9591, grad_fn=<MeanBackward0>)
pos tensor(0.9104, grad_fn=<MeanBackward0>)
neg tensor(0.9388, grad_fn=<MeanBackward0>)
pos tensor(0.9093, grad_fn=<MeanBackward0>)
neg tensor(0.9540, grad_fn=<MeanBackward0>)
pos tensor(0.9177, grad_fn=<MeanBackward0>)
neg tensor(0.9480, grad_fn=<MeanBackward0>)
pos tensor(0.9125, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9353, grad_fn=<MeanBackward0>)
neg tensor(0.9415, grad_fn=<MeanBackward0>)
pos tensor(0.9413, grad_fn=<MeanBackward0>)
neg tensor(0.9480, grad_fn=<MeanBackward0>)
pos tensor(0.9429, grad_fn=<MeanBackward0>)
neg tensor(0.9552, grad_fn=<MeanBackward0>)
pos tensor(0.9358, grad_fn=<MeanBackward0>)
neg tensor(0.9548, grad_fn=<MeanBackward0>)
pos tensor(0.9202, grad_fn=<MeanBackward0>)
neg tensor(0.9494, grad_fn=<MeanBackward0>)
pos tensor(0.9154, grad_fn=<MeanBackward0>)
neg tensor(0.9536, grad_fn=<Mean

Training:   4%|█████▋                                                                                                                                                     | 50/1352 [00:12<05:17,  4.11it/s]

neg tensor(0.9547, grad_fn=<MeanBackward0>)
pos tensor(0.9105, grad_fn=<MeanBackward0>)
neg tensor(0.9551, grad_fn=<MeanBackward0>)
pos tensor(0.9237, grad_fn=<MeanBackward0>)
neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9233, grad_fn=<MeanBackward0>)
neg tensor(0.9352, grad_fn=<MeanBackward0>)
pos tensor(0.9359, grad_fn=<MeanBackward0>)
neg tensor(0.9565, grad_fn=<MeanBackward0>)
pos tensor(0.9190, grad_fn=<MeanBackward0>)
neg tensor(0.9132, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9642, grad_fn=<MeanBackward0>)
pos tensor(0.9378, grad_fn=<MeanBackward0>)
neg tensor(0.9322, grad_fn=<MeanBackward0>)
pos tensor(0.9287, grad_fn=<MeanBackward0>)
neg tensor(0.9519, grad_fn=<MeanBackward0>)
pos tensor(0.9084, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9264, grad_fn=<MeanBackward0>)
neg tensor(0.9570, grad_fn=<MeanBackward0>)
pos tensor(0.9315, grad_fn=<MeanBackward0>)
neg tensor(0.9403, grad_fn=<Mean

Training:   4%|█████▊                                                                                                                                                     | 51/1352 [00:12<05:08,  4.21it/s]

neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9216, grad_fn=<MeanBackward0>)
neg tensor(0.9433, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9446, grad_fn=<MeanBackward0>)
pos tensor(0.9262, grad_fn=<MeanBackward0>)
neg tensor(0.9546, grad_fn=<MeanBackward0>)
pos tensor(0.9183, grad_fn=<MeanBackward0>)
neg tensor(0.9518, grad_fn=<MeanBackward0>)
pos tensor(0.9297, grad_fn=<MeanBackward0>)
neg tensor(0.9450, grad_fn=<MeanBackward0>)
pos tensor(0.9196, grad_fn=<MeanBackward0>)
neg tensor(0.9100, grad_fn=<MeanBackward0>)
pos tensor(0.9067, grad_fn=<MeanBackward0>)
neg tensor(0.9598, grad_fn=<MeanBackward0>)
pos tensor(0.9164, grad_fn=<MeanBackward0>)
neg tensor(0.9354, grad_fn=<MeanBackward0>)
pos tensor(0.9299, grad_fn=<MeanBackward0>)
neg tensor(0.9572, grad_fn=<MeanBackward0>)
pos tensor(0.9315, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9364, grad_fn=<MeanBackward0>)
neg tensor(0.9549, grad_fn=<Mean

Training:   4%|█████▉                                                                                                                                                     | 52/1352 [00:12<05:08,  4.21it/s]

neg tensor(0.9526, grad_fn=<MeanBackward0>)
pos tensor(0.9127, grad_fn=<MeanBackward0>)
neg tensor(0.9544, grad_fn=<MeanBackward0>)
pos tensor(0.9120, grad_fn=<MeanBackward0>)
neg tensor(0.9499, grad_fn=<MeanBackward0>)
pos tensor(0.9147, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9315, grad_fn=<MeanBackward0>)
neg tensor(0.9589, grad_fn=<MeanBackward0>)
pos tensor(0.9370, grad_fn=<MeanBackward0>)
neg tensor(0.9093, grad_fn=<MeanBackward0>)
pos tensor(0.9268, grad_fn=<MeanBackward0>)
neg tensor(0.9524, grad_fn=<MeanBackward0>)
pos tensor(0.9340, grad_fn=<MeanBackward0>)
neg tensor(0.9440, grad_fn=<MeanBackward0>)
pos tensor(0.9038, grad_fn=<MeanBackward0>)
neg tensor(0.9524, grad_fn=<MeanBackward0>)
pos tensor(0.9167, grad_fn=<MeanBackward0>)
neg tensor(0.9540, grad_fn=<MeanBackward0>)
pos tensor(0.9234, grad_fn=<MeanBackward0>)
neg tensor(0.9400, grad_fn=<MeanBackward0>)
pos tensor(0.9185, grad_fn=<MeanBackward0>)
neg tensor(0.9572, grad_fn=<Mean

Training:   4%|██████                                                                                                                                                     | 53/1352 [00:12<05:03,  4.28it/s]

neg tensor(0.9457, grad_fn=<MeanBackward0>)
pos tensor(0.9267, grad_fn=<MeanBackward0>)
neg tensor(0.7475, grad_fn=<MeanBackward0>)
pos tensor(0.9011, grad_fn=<MeanBackward0>)
neg tensor(0.9496, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.9465, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9393, grad_fn=<MeanBackward0>)
pos tensor(0.9359, grad_fn=<MeanBackward0>)
neg tensor(0.9356, grad_fn=<MeanBackward0>)
pos tensor(0.9218, grad_fn=<MeanBackward0>)
neg tensor(0.9543, grad_fn=<MeanBackward0>)
pos tensor(0.9313, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(0.9487, grad_fn=<MeanBackward0>)
neg tensor(0.9452, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9567, grad_fn=<MeanBackward0>)
pos tensor(0.9368, grad_fn=<MeanBackward0>)
neg tensor(0.9549, grad_fn=<MeanBackward0>)
pos tensor(0.9101, grad_fn=<MeanBackward0>)
neg tensor(0.9569, grad_fn=<Mean

Training:   4%|██████▏                                                                                                                                                    | 54/1352 [00:13<05:15,  4.11it/s]

neg tensor(0.9600, grad_fn=<MeanBackward0>)
pos tensor(0.9103, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9463, grad_fn=<MeanBackward0>)
pos tensor(0.9278, grad_fn=<MeanBackward0>)
neg tensor(0.9558, grad_fn=<MeanBackward0>)
pos tensor(0.9083, grad_fn=<MeanBackward0>)
neg tensor(0.9540, grad_fn=<MeanBackward0>)
pos tensor(0.9237, grad_fn=<MeanBackward0>)
neg tensor(0.9489, grad_fn=<MeanBackward0>)
pos tensor(0.9471, grad_fn=<MeanBackward0>)
neg tensor(0.9434, grad_fn=<MeanBackward0>)
pos tensor(0.9335, grad_fn=<MeanBackward0>)
neg tensor(0.9590, grad_fn=<MeanBackward0>)
pos tensor(0.9239, grad_fn=<MeanBackward0>)
neg tensor(0.9553, grad_fn=<MeanBackward0>)
pos tensor(0.9288, grad_fn=<MeanBackward0>)
neg tensor(0.9631, grad_fn=<MeanBackward0>)
pos tensor(0.9332, grad_fn=<MeanBackward0>)
neg tensor(0.7523, grad_fn=<MeanBackward0>)
pos tensor(0.8986, grad_fn=<MeanBackward0>)
neg tensor(0.9553, grad_fn=<MeanBac

Training:   4%|██████▎                                                                                                                                                    | 55/1352 [00:13<05:36,  3.85it/s]

neg tensor(0.9562, grad_fn=<MeanBackward0>)
pos tensor(0.9292, grad_fn=<MeanBackward0>)
neg tensor(0.9613, grad_fn=<MeanBackward0>)
pos tensor(0.9301, grad_fn=<MeanBackward0>)
neg tensor(0.9436, grad_fn=<MeanBackward0>)
pos tensor(0.9123, grad_fn=<MeanBackward0>)
neg tensor(0.9422, grad_fn=<MeanBackward0>)
pos tensor(0.9438, grad_fn=<MeanBackward0>)
neg tensor(0.9609, grad_fn=<MeanBackward0>)
pos tensor(0.9368, grad_fn=<MeanBackward0>)
neg tensor(0.9562, grad_fn=<MeanBackward0>)
pos tensor(0.9222, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9351, grad_fn=<MeanBackward0>)
neg tensor(0.9537, grad_fn=<MeanBackward0>)
pos tensor(0.9112, grad_fn=<MeanBackward0>)
neg tensor(0.9346, grad_fn=<MeanBackward0>)
pos tensor(0.9003, grad_fn=<MeanBackward0>)
neg tensor(0.9644, grad_fn=<MeanBackward0>)
pos tensor(0.9202, grad_fn=<MeanBackward0>)
neg tensor(0.9592, grad_fn=<MeanBackward0>)
pos tensor(0.9479, grad_fn=<MeanBackward0>)
neg tensor(0.9626, grad_fn=<Mean

Training:   4%|██████▍                                                                                                                                                    | 56/1352 [00:13<05:36,  3.85it/s]

neg tensor(0.9599, grad_fn=<MeanBackward0>)
pos tensor(0.9419, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9449, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9258, grad_fn=<MeanBackward0>)
neg tensor(0.9385, grad_fn=<MeanBackward0>)
pos tensor(0.9442, grad_fn=<MeanBackward0>)
neg tensor(0.9339, grad_fn=<MeanBackward0>)
pos tensor(0.9301, grad_fn=<MeanBackward0>)
neg tensor(0.9579, grad_fn=<MeanBackward0>)
pos tensor(0.9387, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9241, grad_fn=<MeanBackward0>)
neg tensor(0.9514, grad_fn=<MeanBackward0>)
pos tensor(0.9152, grad_fn=<MeanBackward0>)
neg tensor(0.9319, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9437, grad_fn=<MeanBackward0>)
pos tensor(0.9095, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9236, grad_fn=<MeanBackward0>)
neg tensor(0.9505, grad_fn=<Mean

Training:   4%|██████▌                                                                                                                                                    | 57/1352 [00:13<05:31,  3.90it/s]

neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9535, grad_fn=<MeanBackward0>)
neg tensor(0.9580, grad_fn=<MeanBackward0>)
pos tensor(0.9360, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(0.9288, grad_fn=<MeanBackward0>)
neg tensor(0.9574, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9373, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9378, grad_fn=<MeanBackward0>)
neg tensor(0.9509, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9633, grad_fn=<MeanBackward0>)
pos tensor(0.9348, grad_fn=<MeanBackward0>)
neg tensor(0.9483, grad_fn=<MeanBackward0>)
pos tensor(0.9224, grad_fn=<MeanBackward0>)
neg tensor(0.9558, grad_fn=<MeanBackward0>)
pos tensor(0.9378, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9313, grad_fn=<MeanBackward0>)
neg tensor(0.9562, grad_fn=<Mean

Training:   4%|██████▋                                                                                                                                                    | 58/1352 [00:14<05:32,  3.89it/s]

neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9297, grad_fn=<MeanBackward0>)
neg tensor(0.9425, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9420, grad_fn=<MeanBackward0>)
pos tensor(0.9169, grad_fn=<MeanBackward0>)
neg tensor(0.9604, grad_fn=<MeanBackward0>)
pos tensor(0.9211, grad_fn=<MeanBackward0>)
neg tensor(0.9565, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9295, grad_fn=<MeanBackward0>)
neg tensor(0.9570, grad_fn=<MeanBackward0>)
pos tensor(0.9342, grad_fn=<MeanBackward0>)
neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(0.9216, grad_fn=<MeanBackward0>)
neg tensor(0.9574, grad_fn=<MeanBackward0>)
pos tensor(0.9155, grad_fn=<MeanBackward0>)
neg tensor(0.9621, grad_fn=<MeanBackward0>)
pos tensor(0.9145, grad_fn=<MeanBackward0>)
neg tensor(0.9494, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9579, grad_fn=<Mean

Training:   4%|██████▊                                                                                                                                                    | 59/1352 [00:14<05:20,  4.03it/s]

neg tensor(0.9633, grad_fn=<MeanBackward0>)
pos tensor(0.9269, grad_fn=<MeanBackward0>)
neg tensor(0.8688, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9199, grad_fn=<MeanBackward0>)
pos tensor(0.9141, grad_fn=<MeanBackward0>)
neg tensor(0.0957, grad_fn=<MeanBackward0>)
pos tensor(0.9249, grad_fn=<MeanBackward0>)
neg tensor(0.9587, grad_fn=<MeanBackward0>)
pos tensor(0.9385, grad_fn=<MeanBackward0>)
neg tensor(0.9420, grad_fn=<MeanBackward0>)
pos tensor(0.9438, grad_fn=<MeanBackward0>)
neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9331, grad_fn=<MeanBackward0>)
neg tensor(0.9575, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9367, grad_fn=<MeanBackward0>)
pos tensor(0.9248, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9481, grad_fn=<MeanBackward0>)
neg tensor(0.9610, grad_fn=<MeanBackward0>)
pos tensor(0.9374, grad_fn=<MeanBackward0>)
neg tensor(0.9500, grad_fn=<Mean

Training:   4%|██████▉                                                                                                                                                    | 60/1352 [00:14<05:38,  3.82it/s]

neg tensor(0.9598, grad_fn=<MeanBackward0>)
pos tensor(0.9343, grad_fn=<MeanBackward0>)
neg tensor(0.9650, grad_fn=<MeanBackward0>)
pos tensor(0.9332, grad_fn=<MeanBackward0>)
neg tensor(0.9607, grad_fn=<MeanBackward0>)
pos tensor(0.9229, grad_fn=<MeanBackward0>)
neg tensor(0.9524, grad_fn=<MeanBackward0>)
pos tensor(0.9132, grad_fn=<MeanBackward0>)
neg tensor(0.9637, grad_fn=<MeanBackward0>)
pos tensor(0.9377, grad_fn=<MeanBackward0>)
neg tensor(0.9586, grad_fn=<MeanBackward0>)
pos tensor(0.9274, grad_fn=<MeanBackward0>)
neg tensor(0.9518, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.9577, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9573, grad_fn=<MeanBackward0>)
pos tensor(0.9328, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9253, grad_fn=<MeanBackward0>)
neg tensor(0.9609, grad_fn=<MeanBackward0>)
pos tensor(0.9301, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<Mean

Training:   5%|██████▉                                                                                                                                                    | 61/1352 [00:15<05:44,  3.75it/s]

neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9315, grad_fn=<MeanBackward0>)
neg tensor(0.9563, grad_fn=<MeanBackward0>)
pos tensor(0.9334, grad_fn=<MeanBackward0>)
neg tensor(0.9579, grad_fn=<MeanBackward0>)
pos tensor(0.9356, grad_fn=<MeanBackward0>)
neg tensor(0.9332, grad_fn=<MeanBackward0>)
pos tensor(0.9268, grad_fn=<MeanBackward0>)
neg tensor(0.9402, grad_fn=<MeanBackward0>)
pos tensor(0.9272, grad_fn=<MeanBackward0>)
neg tensor(0.9568, grad_fn=<MeanBackward0>)
pos tensor(0.9324, grad_fn=<MeanBackward0>)
neg tensor(0.9635, grad_fn=<MeanBackward0>)
pos tensor(0.9402, grad_fn=<MeanBackward0>)
neg tensor(0.9533, grad_fn=<MeanBackward0>)
pos tensor(0.9346, grad_fn=<MeanBackward0>)
neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(0.9280, grad_fn=<MeanBackward0>)
neg tensor(0.9654, grad_fn=<MeanBackward0>)
pos tensor(0.9418, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9362, grad_fn=<MeanBackward0>)
neg tensor(0.9413, grad_fn=<Mean

Training:   5%|███████                                                                                                                                                    | 62/1352 [00:15<05:55,  3.62it/s]

neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9221, grad_fn=<MeanBackward0>)
neg tensor(0.9609, grad_fn=<MeanBackward0>)
pos tensor(0.9401, grad_fn=<MeanBackward0>)
neg tensor(0.9592, grad_fn=<MeanBackward0>)
pos tensor(0.9438, grad_fn=<MeanBackward0>)
neg tensor(0.9552, grad_fn=<MeanBackward0>)
pos tensor(0.9211, grad_fn=<MeanBackward0>)
neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9316, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9427, grad_fn=<MeanBackward0>)
neg tensor(0.9598, grad_fn=<MeanBackward0>)
pos tensor(0.9302, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(0.9402, grad_fn=<MeanBackward0>)
neg tensor(0.9589, grad_fn=<MeanBackward0>)
pos tensor(0.9436, grad_fn=<MeanBackward0>)
neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9289, grad_fn=<MeanBackward0>)
neg tensor(0.9634, grad_fn=<Mean

Training:   5%|███████▏                                                                                                                                                   | 63/1352 [00:15<05:42,  3.76it/s]

neg tensor(0.9553, grad_fn=<MeanBackward0>)
pos tensor(0.9377, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(0.9250, grad_fn=<MeanBackward0>)
neg tensor(0.9415, grad_fn=<MeanBackward0>)
pos tensor(0.9475, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9363, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9407, grad_fn=<MeanBackward0>)
neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(0.9385, grad_fn=<MeanBackward0>)
neg tensor(0.9147, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9413, grad_fn=<MeanBackward0>)
pos tensor(0.9261, grad_fn=<MeanBackward0>)
neg tensor(0.9652, grad_fn=<MeanBackward0>)
pos tensor(0.9449, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(0.9518, grad_fn=<MeanBackward0>)
neg tensor(0.9514, grad_fn=<MeanBackward0>)
pos tensor(0.9230, grad_fn=<MeanBackward0>)
neg tensor(0.9601, grad_fn=<MeanBack

Training:   5%|███████▎                                                                                                                                                   | 64/1352 [00:15<05:29,  3.91it/s]

neg tensor(0.7124, grad_fn=<MeanBackward0>)
pos tensor(0.9553, grad_fn=<MeanBackward0>)
neg tensor(0.9639, grad_fn=<MeanBackward0>)
pos tensor(0.9375, grad_fn=<MeanBackward0>)
neg tensor(0.9554, grad_fn=<MeanBackward0>)
pos tensor(0.9464, grad_fn=<MeanBackward0>)
neg tensor(0.9386, grad_fn=<MeanBackward0>)
pos tensor(0.9228, grad_fn=<MeanBackward0>)
neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9305, grad_fn=<MeanBackward0>)
neg tensor(0.9621, grad_fn=<MeanBackward0>)
pos tensor(0.9387, grad_fn=<MeanBackward0>)
neg tensor(0.9389, grad_fn=<MeanBackward0>)
pos tensor(0.9423, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9279, grad_fn=<MeanBackward0>)
neg tensor(0.9431, grad_fn=<MeanBackward0>)
pos tensor(0.9309, grad_fn=<MeanBackward0>)
neg tensor(0.9504, grad_fn=<MeanBackward0>)
pos tensor(0.9606, grad_fn=<MeanBackward0>)
neg tensor(0.9577, grad_fn=<MeanBackward0>)
pos tensor(0.9360, grad_fn=<MeanBackward0>)
neg tensor(0.9405, grad_fn=<Mean

Training:   5%|███████▍                                                                                                                                                   | 65/1352 [00:16<05:18,  4.04it/s]

neg tensor(0.9557, grad_fn=<MeanBackward0>)
pos tensor(0.9469, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9373, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9375, grad_fn=<MeanBackward0>)
neg tensor(0.9587, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9365, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9484, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9371, grad_fn=<MeanBackward0>)
neg tensor(0.4367, grad_fn=<MeanBackward0>)
pos tensor(0.9259, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9453, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(0.9514, grad_fn=<MeanBackward0>)
neg tensor(0.9658, grad_fn=<MeanBackward0>)
pos tensor(0.9305, grad_fn=<MeanBackward0>)
neg tensor(0.9299, grad_fn=<Mean

Training:   5%|███████▌                                                                                                                                                   | 66/1352 [00:16<05:21,  4.00it/s]

neg tensor(0.9582, grad_fn=<MeanBackward0>)
pos tensor(0.9490, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9333, grad_fn=<MeanBackward0>)
neg tensor(0.9554, grad_fn=<MeanBackward0>)
pos tensor(0.9595, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9394, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9361, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9383, grad_fn=<MeanBackward0>)
neg tensor(0.9544, grad_fn=<MeanBackward0>)
pos tensor(0.9236, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9228, grad_fn=<MeanBackward0>)
neg tensor(0.9640, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9399, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9623, grad_fn=<MeanBackward0>)
pos tensor(0.9317, grad_fn=<MeanBackward0>)
neg tensor(0.9633, grad_fn=<Mean

Training:   5%|███████▋                                                                                                                                                   | 67/1352 [00:16<05:09,  4.15it/s]

neg tensor(0.9658, grad_fn=<MeanBackward0>)
pos tensor(0.9422, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9399, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9394, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9232, grad_fn=<MeanBackward0>)
neg tensor(0.9650, grad_fn=<MeanBackward0>)
pos tensor(0.9467, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9498, grad_fn=<MeanBackward0>)
neg tensor(0.9571, grad_fn=<MeanBackward0>)
pos tensor(0.9425, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9368, grad_fn=<MeanBackward0>)
neg tensor(0.9499, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9633, grad_fn=<MeanBackward0>)
pos tensor(0.9429, grad_fn=<MeanBackward0>)
neg tensor(0.9578, grad_fn=<MeanBackward0>)
pos tensor(0.9446, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<Mean

Training:   5%|███████▊                                                                                                                                                   | 68/1352 [00:16<05:03,  4.22it/s]

neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9447, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9376, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9386, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9522, grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9409, grad_fn=<MeanBackward0>)
neg tensor(0.9169, grad_fn=<MeanBackward0>)
pos tensor(0.9313, grad_fn=<MeanBackward0>)
neg tensor(0.9590, grad_fn=<MeanBackward0>)
pos tensor(0.9424, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9518, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9381, grad_fn=<MeanBackward0>)
neg tensor(0.9502, grad_fn=<MeanBackward0>)
pos tensor(0.9371, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<Mean

Training:   5%|███████▉                                                                                                                                                   | 69/1352 [00:17<05:07,  4.17it/s]

neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9457, grad_fn=<MeanBackward0>)
neg tensor(0.5906, grad_fn=<MeanBackward0>)
pos tensor(0.9382, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(0.9353, grad_fn=<MeanBackward0>)
neg tensor(0.9623, grad_fn=<MeanBackward0>)
pos tensor(0.9435, grad_fn=<MeanBackward0>)
neg tensor(0.9548, grad_fn=<MeanBackward0>)
pos tensor(0.9536, grad_fn=<MeanBackward0>)
neg tensor(0.9483, grad_fn=<MeanBackward0>)
pos tensor(0.9509, grad_fn=<MeanBackward0>)
neg tensor(0.9672, grad_fn=<MeanBackward0>)
pos tensor(0.9353, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9477, grad_fn=<MeanBackward0>)
neg tensor(0.9583, grad_fn=<MeanBackward0>)
pos tensor(0.9487, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9385, grad_fn=<MeanBackward0>)
neg tensor(0.9489, grad_fn=<MeanBackward0>)
pos tensor(0.9535, grad_fn=<MeanBackward0>)
neg tensor(0.9564, grad_fn=<Mean

Training:   5%|████████                                                                                                                                                   | 70/1352 [00:17<05:11,  4.11it/s]

neg tensor(0.9623, grad_fn=<MeanBackward0>)
pos tensor(0.9333, grad_fn=<MeanBackward0>)
neg tensor(0.9540, grad_fn=<MeanBackward0>)
pos tensor(0.9366, grad_fn=<MeanBackward0>)
neg tensor(0.9487, grad_fn=<MeanBackward0>)
pos tensor(0.9261, grad_fn=<MeanBackward0>)
neg tensor(0.9620, grad_fn=<MeanBackward0>)
pos tensor(0.9387, grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9431, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9519, grad_fn=<MeanBackward0>)
pos tensor(0.9477, grad_fn=<MeanBackward0>)
neg tensor(0.8208, grad_fn=<MeanBackward0>)
pos tensor(0.9307, grad_fn=<MeanBackward0>)
neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9358, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9357, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9347, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<Mean

Training:   5%|████████▏                                                                                                                                                  | 71/1352 [00:17<05:08,  4.15it/s]

neg tensor(0.9496, grad_fn=<MeanBackward0>)
pos tensor(0.9605, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9562, grad_fn=<MeanBackward0>)
pos tensor(0.9330, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9540, grad_fn=<MeanBackward0>)
neg tensor(0.9612, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9195, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9462, grad_fn=<MeanBackward0>)
neg tensor(0.9603, grad_fn=<MeanBackward0>)
pos tensor(0.9260, grad_fn=<MeanBackward0>)
neg tensor(0.9614, grad_fn=<MeanBackward0>)
pos tensor(0.9436, grad_fn=<MeanBackward0>)
neg tensor(0.9707, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9661, grad_fn=<Mean

Training:   5%|████████▎                                                                                                                                                  | 72/1352 [00:17<05:15,  4.05it/s]

neg tensor(0.9604, grad_fn=<MeanBackward0>)
pos tensor(0.9423, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9458, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9344, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9352, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9491, grad_fn=<MeanBackward0>)
pos tensor(0.9549, grad_fn=<MeanBackward0>)
neg tensor(0.9245, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9452, grad_fn=<MeanBackward0>)
neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9443, grad_fn=<MeanBackward0>)
neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9385, grad_fn=<MeanBackward0>)
neg tensor(0.9281, grad_fn=<Mean

Training:   5%|████████▎                                                                                                                                                  | 73/1352 [00:18<05:24,  3.94it/s]

neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(0.9479, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9402, grad_fn=<MeanBackward0>)
neg tensor(0.9498, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9578, grad_fn=<MeanBackward0>)
pos tensor(0.9399, grad_fn=<MeanBackward0>)
neg tensor(0.9652, grad_fn=<MeanBackward0>)
pos tensor(0.9451, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9288, grad_fn=<MeanBackward0>)
neg tensor(0.9607, grad_fn=<MeanBackward0>)
pos tensor(0.9437, grad_fn=<MeanBackward0>)
neg tensor(0.9572, grad_fn=<MeanBackward0>)
pos tensor(0.9396, grad_fn=<MeanBackward0>)
neg tensor(0.9676, grad_fn=<MeanBackward0>)
pos tensor(0.9443, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9386, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9366, grad_fn=<MeanBackward0>)
neg tensor(0.9640, grad_fn=<Mean

Training:   5%|████████▍                                                                                                                                                  | 74/1352 [00:18<06:15,  3.40it/s]

neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9392, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9379, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<MeanBackward0>)
pos tensor(0.9454, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9508, grad_fn=<MeanBackward0>)
neg tensor(0.9567, grad_fn=<MeanBackward0>)
pos tensor(0.9363, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(0.9408, grad_fn=<MeanBackward0>)
neg tensor(0.9310, grad_fn=<MeanBackward0>)
pos tensor(0.9294, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9333, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(0.9384, grad_fn=<MeanBackward0>)
neg tensor(0.9665, grad_fn=<MeanBackward0>)
pos tensor(0.9361, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9377, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<Mean

Training:   6%|████████▌                                                                                                                                                  | 75/1352 [00:18<05:46,  3.69it/s]

neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9415, grad_fn=<MeanBackward0>)
neg tensor(0.9648, grad_fn=<MeanBackward0>)
pos tensor(0.9523, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9538, grad_fn=<MeanBackward0>)
neg tensor(0.9580, grad_fn=<MeanBackward0>)
pos tensor(0.9500, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(0.9300, grad_fn=<MeanBackward0>)
neg tensor(0.9648, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(0.9481, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(0.9469, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<MeanBackward0>)
pos tensor(0.9408, grad_fn=<MeanBackward0>)
neg tensor(0.9582, grad_fn=<MeanBackward0>)
pos tensor(0.9430, grad_fn=<MeanBackward0>)
neg tensor(0.9532, grad_fn=<MeanBack

Training:   6%|████████▋                                                                                                                                                  | 76/1352 [00:18<05:58,  3.56it/s]

neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9415, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.9593, grad_fn=<MeanBackward0>)
pos tensor(0.9459, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(0.9452, grad_fn=<MeanBackward0>)
neg tensor(0.9508, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9651, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9589, grad_fn=<MeanBackward0>)
pos tensor(0.9325, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9431, grad_fn=<MeanBackward0>)
neg tensor(0.9672, grad_fn=<MeanBackward0>)
pos tensor(0.9380, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9337, grad_fn=<MeanBackward0>)
neg tensor(0.9640, grad_fn=<MeanBackward0>)
pos tensor(0.9474, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<Mean

Training:   6%|████████▊                                                                                                                                                  | 77/1352 [00:19<05:45,  3.69it/s]

neg tensor(0.9544, grad_fn=<MeanBackward0>)
pos tensor(0.9254, grad_fn=<MeanBackward0>)
neg tensor(0.9629, grad_fn=<MeanBackward0>)
pos tensor(0.9386, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<MeanBackward0>)
pos tensor(0.9500, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9405, grad_fn=<MeanBackward0>)
neg tensor(0.9484, grad_fn=<MeanBackward0>)
pos tensor(0.9179, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9459, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9466, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9394, grad_fn=<MeanBackward0>)
neg tensor(0.9543, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9650, grad_fn=<MeanBackward0>)
pos tensor(0.9314, grad_fn=<MeanBackward0>)
neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9506, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<Mean

Training:   6%|████████▉                                                                                                                                                  | 78/1352 [00:19<05:37,  3.77it/s]

neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(0.9467, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9663, grad_fn=<MeanBackward0>)
pos tensor(0.9470, grad_fn=<MeanBackward0>)
neg tensor(0.9672, grad_fn=<MeanBackward0>)
pos tensor(0.9404, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9442, grad_fn=<MeanBackward0>)
neg tensor(0.9625, grad_fn=<MeanBackward0>)
pos tensor(0.9465, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9634, grad_fn=<MeanBackward0>)
pos tensor(0.9393, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9358, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9519, grad_fn=<MeanBackward0>)
neg tensor(0.9326, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<Mean

Training:   6%|█████████                                                                                                                                                  | 79/1352 [00:19<05:32,  3.83it/s]

neg tensor(0.9692, grad_fn=<MeanBackward0>)
pos tensor(0.9386, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9430, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9508, grad_fn=<MeanBackward0>)
neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(0.9495, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9642, grad_fn=<MeanBackward0>)
neg tensor(0.9615, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9427, grad_fn=<MeanBackward0>)
neg tensor(0.9378, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9489, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9483, grad_fn=<MeanBackward0>)
neg tensor(0.9550, grad_fn=<MeanBack

Training:   6%|█████████▏                                                                                                                                                 | 80/1352 [00:19<05:22,  3.95it/s]

neg tensor(0.9548, grad_fn=<MeanBackward0>)
pos tensor(0.9556, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9375, grad_fn=<MeanBackward0>)
neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9548, grad_fn=<MeanBackward0>)
neg tensor(0.9625, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9614, grad_fn=<MeanBackward0>)
pos tensor(0.9382, grad_fn=<MeanBackward0>)
neg tensor(0.9587, grad_fn=<MeanBackward0>)
pos tensor(0.9435, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9678, grad_fn=<MeanBackward0>)
pos tensor(0.9454, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9323, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9393, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<Mean

Training:   6%|█████████▎                                                                                                                                                 | 81/1352 [00:20<05:29,  3.85it/s]

neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9507, grad_fn=<MeanBackward0>)
neg tensor(0.9535, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9389, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9481, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9327, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9450, grad_fn=<MeanBackward0>)
neg tensor(0.9532, grad_fn=<MeanBackward0>)
pos tensor(0.9476, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9414, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9453, grad_fn=<MeanBackward0>)
neg tensor(0.9424, grad_fn=<MeanBackward0>)
pos tensor(0.9464, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<Mean

Training:   6%|█████████▍                                                                                                                                                 | 82/1352 [00:20<05:16,  4.02it/s]

neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9644, grad_fn=<MeanBackward0>)
pos tensor(0.9393, grad_fn=<MeanBackward0>)
neg tensor(0.9557, grad_fn=<MeanBackward0>)
pos tensor(0.9581, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9379, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9438, grad_fn=<MeanBackward0>)
neg tensor(0.9631, grad_fn=<MeanBackward0>)
pos tensor(0.9424, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBackward0>)
pos tensor(0.9296, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9509, grad_fn=<MeanBackward0>)
neg tensor(0.9254, grad_fn=<MeanBackward0>)
pos tensor(0.9472, grad_fn=<MeanBackward0>)
neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9542, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<Mean

Training:   6%|█████████▌                                                                                                                                                 | 83/1352 [00:20<05:04,  4.16it/s]

neg tensor(0.9593, grad_fn=<MeanBackward0>)
pos tensor(0.9351, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(0.9519, grad_fn=<MeanBackward0>)
neg tensor(0.7824, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9276, grad_fn=<MeanBackward0>)
pos tensor(0.9586, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9460, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9399, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9676, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9338, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9464, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<Mean

Training:   6%|█████████▋                                                                                                                                                 | 84/1352 [00:20<05:18,  3.98it/s]

neg tensor(0.9241, grad_fn=<MeanBackward0>)
pos tensor(0.9401, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9577, grad_fn=<MeanBackward0>)
neg tensor(0.9579, grad_fn=<MeanBackward0>)
pos tensor(0.9507, grad_fn=<MeanBackward0>)
neg tensor(0.9247, grad_fn=<MeanBackward0>)
pos tensor(0.9516, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(0.9461, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9577, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9549, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9444, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(0.9615, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<Mean

Training:   6%|█████████▋                                                                                                                                                 | 85/1352 [00:21<05:29,  3.85it/s]

neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9469, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9500, grad_fn=<MeanBackward0>)
neg tensor(0.9322, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9504, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9425, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9503, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9554, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9414, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9481, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9516, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<Mean

Training:   6%|█████████▊                                                                                                                                                 | 86/1352 [00:21<05:23,  3.91it/s]

neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9478, grad_fn=<MeanBackward0>)
neg tensor(0.9616, grad_fn=<MeanBackward0>)
pos tensor(0.9560, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9415, grad_fn=<MeanBackward0>)
neg tensor(0.9663, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9419, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9467, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9554, grad_fn=<MeanBackward0>)
neg tensor(0.9293, grad_fn=<MeanBackward0>)
pos tensor(0.9354, grad_fn=<MeanBackward0>)
neg tensor(0.9665, grad_fn=<MeanBackward0>)
pos tensor(0.9408, grad_fn=<MeanBackward0>)
neg tensor(0.9552, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9622, grad_fn=<Mean

Training:   6%|█████████▉                                                                                                                                                 | 87/1352 [00:21<04:59,  4.23it/s]

neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9406, grad_fn=<MeanBackward0>)
neg tensor(0.9639, grad_fn=<MeanBackward0>)
pos tensor(0.9518, grad_fn=<MeanBackward0>)
neg tensor(0.9559, grad_fn=<MeanBackward0>)
pos tensor(0.9326, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9504, grad_fn=<MeanBackward0>)
neg tensor(0.8884, grad_fn=<MeanBackward0>)
pos tensor(0.9477, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(0.9370, grad_fn=<MeanBackward0>)
neg tensor(0.9541, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9599, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9652, grad_fn=<MeanBackward0>)
pos tensor(0.9595, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9563, grad_fn=<MeanBackward0>)
neg tensor(0.9484, grad_fn=<MeanBack

Training:   7%|██████████                                                                                                                                                 | 88/1352 [00:21<04:54,  4.29it/s]

neg tensor(0.9650, grad_fn=<MeanBackward0>)
pos tensor(0.9367, grad_fn=<MeanBackward0>)
neg tensor(0.9635, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9644, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9535, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9592, grad_fn=<MeanBackward0>)
neg tensor(0.9551, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9478, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9522, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<Mean

Training:   7%|██████████▏                                                                                                                                                | 89/1352 [00:22<04:52,  4.33it/s]

neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9547, grad_fn=<MeanBackward0>)
neg tensor(0.9324, grad_fn=<MeanBackward0>)
pos tensor(0.8989, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9385, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9499, grad_fn=<MeanBackward0>)
neg tensor(0.9503, grad_fn=<MeanBackward0>)
pos tensor(0.9567, grad_fn=<MeanBackward0>)
neg tensor(0.9488, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9480, grad_fn=<MeanBackward0>)
neg tensor(0.9590, grad_fn=<MeanBackward0>)
pos tensor(0.9524, grad_fn=<MeanBackward0>)
neg tensor(0.9620, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9692, grad_fn=<MeanBackward0>)
pos tensor(0.9568, grad_fn=<MeanBackward0>)
neg tensor(0.9666, grad_fn=<Mean

Training:   7%|██████████▎                                                                                                                                                | 90/1352 [00:22<05:01,  4.19it/s]

neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9445, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9434, grad_fn=<MeanBackward0>)
neg tensor(0.9708, grad_fn=<MeanBackward0>)
pos tensor(0.9477, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(0.9519, grad_fn=<MeanBackward0>)
neg tensor(0.9555, grad_fn=<MeanBackward0>)
pos tensor(0.9452, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9531, grad_fn=<MeanBackward0>)
neg tensor(0.9542, grad_fn=<MeanBackward0>)
pos tensor(0.9567, grad_fn=<MeanBackward0>)
neg tensor(0.9469, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9581, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9532, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9455, grad_fn=<MeanBackward0>)
neg tensor(0.9663, grad_fn=<Mean

Training:   7%|██████████▍                                                                                                                                                | 91/1352 [00:22<05:12,  4.04it/s]

neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9492, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9422, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9458, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9521, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(0.9567, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9568, grad_fn=<MeanBackward0>)
pos tensor(0.9454, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9469, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9689, grad_fn=<MeanBackward0>)
pos tensor(0.9516, grad_fn=<MeanBackward0>)
neg tensor(0.9722, grad_fn=<Mean

Training:   7%|██████████▌                                                                                                                                                | 92/1352 [00:22<05:26,  3.86it/s]

neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9537, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<MeanBackward0>)
pos tensor(0.9457, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(0.9395, grad_fn=<MeanBackward0>)
neg tensor(0.9609, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9486, grad_fn=<MeanBackward0>)
neg tensor(0.9708, grad_fn=<MeanBackward0>)
pos tensor(0.9458, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9460, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9423, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9400, grad_fn=<MeanBackward0>)
neg tensor(0.8996, grad_fn=<MeanBackward0>)
pos tensor(0.9629, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<Mean

Training:   7%|██████████▋                                                                                                                                                | 93/1352 [00:23<05:20,  3.93it/s]

neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9439, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9549, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(0.9526, grad_fn=<MeanBackward0>)
neg tensor(0.9575, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9398, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9532, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9556, grad_fn=<MeanBackward0>)
neg tensor(0.9366, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9489, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9513, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<Mean

Training:   7%|██████████▊                                                                                                                                                | 94/1352 [00:23<05:21,  3.91it/s]

neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9518, grad_fn=<MeanBackward0>)
neg tensor(0.9616, grad_fn=<MeanBackward0>)
pos tensor(0.9369, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9563, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(0.9509, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9511, grad_fn=<MeanBackward0>)
pos tensor(0.9547, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9666, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9562, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9470, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBac

Training:   7%|██████████▉                                                                                                                                                | 95/1352 [00:23<04:59,  4.20it/s]

neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9534, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9451, grad_fn=<MeanBackward0>)
neg tensor(0.9600, grad_fn=<MeanBackward0>)
pos tensor(0.9738, grad_fn=<MeanBackward0>)
neg tensor(0.9707, grad_fn=<MeanBackward0>)
pos tensor(0.9465, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9586, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9620, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9600, grad_fn=<MeanBackward0>)
pos tensor(0.9415, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9454, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<Mean

Training:   7%|███████████                                                                                                                                                | 96/1352 [00:23<04:50,  4.32it/s]

neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9516, grad_fn=<MeanBackward0>)
neg tensor(0.9687, grad_fn=<MeanBackward0>)
pos tensor(0.9586, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9563, grad_fn=<MeanBackward0>)
neg tensor(0.9336, grad_fn=<MeanBackward0>)
pos tensor(0.9460, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9417, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9564, grad_fn=<MeanBackward0>)
neg tensor(0.9351, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9471, grad_fn=<MeanBackward0>)
neg tensor(0.9622, grad_fn=<MeanBackward0>)
pos tensor(0.9285, grad_fn=<MeanBackward0>)
neg tensor(0.9687, grad_fn=<Mean

Training:   7%|███████████                                                                                                                                                | 97/1352 [00:24<04:42,  4.44it/s]

neg tensor(0.9554, grad_fn=<MeanBackward0>)
pos tensor(0.9336, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9542, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9454, grad_fn=<MeanBackward0>)
neg tensor(0.9491, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9389, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9544, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9596, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9424, grad_fn=<MeanBackward0>)
neg tensor(0.9445, grad_fn=<Mean

Training:   7%|███████████▏                                                                                                                                               | 98/1352 [00:24<04:45,  4.39it/s]

neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9483, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9482, grad_fn=<MeanBackward0>)
neg tensor(0.9631, grad_fn=<MeanBackward0>)
pos tensor(0.9412, grad_fn=<MeanBackward0>)
neg tensor(0.9524, grad_fn=<MeanBackward0>)
pos tensor(0.9594, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9468, grad_fn=<MeanBackward0>)
neg tensor(0.9687, grad_fn=<MeanBackward0>)
pos tensor(0.9594, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9491, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(0.9470, grad_fn=<MeanBackward0>)
neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9469, grad_fn=<MeanBackward0>)
neg tensor(0.9591, grad_fn=<Mean

Training:   7%|███████████▎                                                                                                                                               | 99/1352 [00:24<04:37,  4.52it/s]

neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9472, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(0.9381, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9595, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9581, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9558, grad_fn=<MeanBackward0>)
pos tensor(0.9569, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<Mean

Training:   7%|███████████▍                                                                                                                                              | 100/1352 [00:24<04:55,  4.24it/s]

neg tensor(0.9588, grad_fn=<MeanBackward0>)
pos tensor(0.9566, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9471, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9492, grad_fn=<MeanBackward0>)
neg tensor(0.9021, grad_fn=<MeanBackward0>)
pos tensor(0.9327, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9523, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9586, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9402, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9546, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<Mean

Training:   7%|███████████▌                                                                                                                                              | 101/1352 [00:25<05:13,  3.99it/s]

neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9526, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9448, grad_fn=<MeanBackward0>)
neg tensor(0.9493, grad_fn=<MeanBackward0>)
pos tensor(0.9458, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9709, grad_fn=<MeanBackward0>)
pos tensor(0.9402, grad_fn=<MeanBackward0>)
neg tensor(0.9707, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9481, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9522, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9536, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<Mean

Training:   8%|███████████▌                                                                                                                                              | 102/1352 [00:25<05:48,  3.58it/s]

neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9495, grad_fn=<MeanBackward0>)
neg tensor(0.9587, grad_fn=<MeanBackward0>)
pos tensor(0.9373, grad_fn=<MeanBackward0>)
neg tensor(0.9498, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9486, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9605, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9542, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9520, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9501, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9372, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9519, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<Mean

Training:   8%|███████████▋                                                                                                                                              | 103/1352 [00:25<05:24,  3.85it/s]

neg tensor(0.9528, grad_fn=<MeanBackward0>)
pos tensor(0.9532, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.3102, grad_fn=<MeanBackward0>)
pos tensor(0.9534, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9551, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9514, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9357, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9513, grad_fn=<MeanBackward0>)
neg tensor(0.9358, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.8316, grad_fn=<MeanBackward0>)
pos tensor(0.9398, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<Mean

Training:   8%|███████████▊                                                                                                                                              | 104/1352 [00:25<05:21,  3.88it/s]

neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9643, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9508, grad_fn=<MeanBackward0>)
neg tensor(0.9438, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9444, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9521, grad_fn=<MeanBackward0>)
neg tensor(0.9642, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9525, grad_fn=<MeanBackward0>)
neg tensor(0.9680, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBack

Training:   8%|███████████▉                                                                                                                                              | 105/1352 [00:26<05:04,  4.10it/s]

neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9606, grad_fn=<MeanBackward0>)
neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(0.9378, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9573, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9546, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9427, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9406, grad_fn=<MeanBackward0>)
neg tensor(0.9563, grad_fn=<MeanBackward0>)
pos tensor(0.9535, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9537, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9601, grad_fn=<MeanBackward0>)
neg tensor(0.9545, grad_fn=<MeanBackward0>)
pos tensor(0.9539, grad_fn=<MeanBackward0>)
neg tensor(0.9644, grad_fn=<Mean

Training:   8%|████████████                                                                                                                                              | 106/1352 [00:26<05:14,  3.96it/s]

neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9548, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9521, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9471, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9535, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.4719, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9464, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9511, grad_fn=<MeanBackward0>)
neg tensor(0.9707, grad_fn=<MeanBackward0>)
pos tensor(0.9557, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<Mean

Training:   8%|████████████▏                                                                                                                                             | 107/1352 [00:26<05:27,  3.80it/s]

neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9506, grad_fn=<MeanBackward0>)
neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9596, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9604, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9525, grad_fn=<MeanBackward0>)
neg tensor(0.9542, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9665, grad_fn=<MeanBackward0>)
pos tensor(0.9427, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9524, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9557, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9539, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<Mean

Training:   8%|████████████▎                                                                                                                                             | 108/1352 [00:26<05:13,  3.97it/s]

neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9466, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9551, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9568, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9513, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9533, grad_fn=<MeanBackward0>)
neg tensor(0.9613, grad_fn=<MeanBackward0>)
pos tensor(0.9624, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9566, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9510, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<Mean

Training:   8%|████████████▍                                                                                                                                             | 109/1352 [00:27<05:07,  4.04it/s]

neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9526, grad_fn=<MeanBackward0>)
neg tensor(0.9496, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9544, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9613, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9467, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9569, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9531, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<Mean

Training:   8%|████████████▌                                                                                                                                             | 110/1352 [00:27<05:16,  3.93it/s]

neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9552, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9523, grad_fn=<MeanBackward0>)
neg tensor(0.9571, grad_fn=<MeanBackward0>)
pos tensor(0.9543, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9493, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9526, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9572, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<Mean

Training:   8%|████████████▋                                                                                                                                             | 111/1352 [00:27<05:22,  3.85it/s]

neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9594, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9631, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9533, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9472, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<Mean

Training:   8%|████████████▊                                                                                                                                             | 112/1352 [00:27<05:22,  3.85it/s]

neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9604, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9533, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9523, grad_fn=<MeanBackward0>)
neg tensor(0.9399, grad_fn=<MeanBackward0>)
pos tensor(0.9467, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9579, grad_fn=<MeanBackward0>)
neg tensor(0.9500, grad_fn=<MeanBackward0>)
pos tensor(0.9550, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9598, grad_fn=<Mean

Training:   8%|████████████▊                                                                                                                                             | 113/1352 [00:28<05:19,  3.88it/s]

neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9639, grad_fn=<MeanBackward0>)
pos tensor(0.9453, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9596, grad_fn=<MeanBackward0>)
neg tensor(0.9722, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9500, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9481, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9531, grad_fn=<MeanBackward0>)
neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<Mean

Training:   8%|████████████▉                                                                                                                                             | 114/1352 [00:28<05:14,  3.93it/s]

neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9539, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<Mean

Training:   9%|█████████████                                                                                                                                             | 115/1352 [00:28<05:00,  4.11it/s]

neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9501, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9461, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9564, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.9565, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9543, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9586, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9605, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9513, grad_fn=<MeanBackward0>)
neg tensor(0.9460, grad_fn=<Mean

Training:   9%|█████████████▏                                                                                                                                            | 116/1352 [00:28<04:55,  4.19it/s]

neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9548, grad_fn=<MeanBackward0>)
neg tensor(0.9599, grad_fn=<MeanBackward0>)
pos tensor(0.9642, grad_fn=<MeanBackward0>)
neg tensor(0.9502, grad_fn=<MeanBackward0>)
pos tensor(0.9628, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9571, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.5796, grad_fn=<MeanBackward0>)
pos tensor(0.9601, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9624, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9613, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<Mean

Training:   9%|█████████████▎                                                                                                                                            | 117/1352 [00:29<05:05,  4.04it/s]

neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9582, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9575, grad_fn=<MeanBackward0>)
neg tensor(0.9610, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9541, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9612, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<Mean

Training:   9%|█████████████▍                                                                                                                                            | 118/1352 [00:29<04:57,  4.14it/s]

neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9581, grad_fn=<MeanBackward0>)
neg tensor(0.9678, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9472, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9524, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9586, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9553, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9564, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9571, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9577, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBack

Training:   9%|█████████████▌                                                                                                                                            | 119/1352 [00:29<04:53,  4.20it/s]

neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9539, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.6432, grad_fn=<MeanBackward0>)
pos tensor(0.9545, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9578, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBackward0>)
pos tensor(0.9570, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9615, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9658, grad_fn=<Mean

Training:   9%|█████████████▋                                                                                                                                            | 120/1352 [00:29<04:51,  4.22it/s]

neg tensor(0.9676, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9592, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9601, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<Mean

Training:   9%|█████████████▊                                                                                                                                            | 121/1352 [00:29<04:44,  4.33it/s]

neg tensor(0.9369, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9580, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9652, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9533, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9563, grad_fn=<MeanBackward0>)
pos tensor(0.9520, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9492, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<Mean

Training:   9%|█████████████▉                                                                                                                                            | 122/1352 [00:30<04:43,  4.35it/s]

neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9598, grad_fn=<MeanBackward0>)
neg tensor(0.9535, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9522, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9556, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9559, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9637, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<Mean

Training:   9%|██████████████                                                                                                                                            | 123/1352 [00:30<04:39,  4.40it/s]

neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.9528, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9595, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9565, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9572, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBack

Training:   9%|██████████████                                                                                                                                            | 124/1352 [00:30<04:50,  4.23it/s]

neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9486, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9612, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9523, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9540, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9540, grad_fn=<MeanBackward0>)
neg tensor(0.9537, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9572, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<Mean

Training:   9%|██████████████▏                                                                                                                                           | 125/1352 [00:30<04:36,  4.43it/s]

neg tensor(0.9446, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9589, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9680, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9612, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<Mean

Training:   9%|██████████████▎                                                                                                                                           | 126/1352 [00:31<05:03,  4.03it/s]

neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9621, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9564, grad_fn=<MeanBackward0>)
neg tensor(0.9243, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9568, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9709, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<Mean

Training:   9%|██████████████▍                                                                                                                                           | 127/1352 [00:31<05:07,  3.99it/s]

neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9598, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9588, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9561, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<Mean

Training:   9%|██████████████▌                                                                                                                                           | 128/1352 [00:31<05:14,  3.89it/s]

neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9573, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9512, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9521, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9572, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<Mean

Training:  10%|██████████████▋                                                                                                                                           | 129/1352 [00:31<05:12,  3.91it/s]

neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9628, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9517, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9554, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9515, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<Mean

Training:  10%|██████████████▊                                                                                                                                           | 130/1352 [00:32<04:58,  4.09it/s]

neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9623, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9527, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9610, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9708, grad_fn=<Mean

Training:  10%|██████████████▉                                                                                                                                           | 131/1352 [00:32<04:52,  4.17it/s]

neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9722, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8405, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9566, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<Mean

Training:  10%|███████████████                                                                                                                                           | 132/1352 [00:32<05:01,  4.05it/s]

neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9562, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9575, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9657, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<Mean

Training:  10%|███████████████▏                                                                                                                                          | 133/1352 [00:32<05:04,  4.00it/s]

neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9589, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9600, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(0.9598, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9594, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9542, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBack

Training:  10%|███████████████▎                                                                                                                                          | 134/1352 [00:33<05:15,  3.86it/s]

neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9715, grad_fn=<MeanBackward0>)
pos tensor(0.9629, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<MeanBackward0>)
pos tensor(0.9605, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9631, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9511, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9589, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9613, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<Mean

Training:  10%|███████████████▍                                                                                                                                          | 135/1352 [00:33<05:17,  3.84it/s]

neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9671, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9564, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9578, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9580, grad_fn=<MeanBackward0>)
neg tensor(0.9651, grad_fn=<Mean

Training:  10%|███████████████▍                                                                                                                                          | 136/1352 [00:33<04:57,  4.09it/s]

neg tensor(0.9349, grad_fn=<MeanBackward0>)
pos tensor(0.9319, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9582, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9671, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.5369, grad_fn=<MeanBackward0>)
pos tensor(0.9541, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9657, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<Mean

Training:  10%|███████████████▌                                                                                                                                          | 137/1352 [00:33<05:01,  4.03it/s]

neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9595, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9615, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9716, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.6434, grad_fn=<Mean

Training:  10%|███████████████▋                                                                                                                                          | 138/1352 [00:34<05:13,  3.87it/s]

neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9563, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9599, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9657, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.8928, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<Mean

Training:  10%|███████████████▊                                                                                                                                          | 139/1352 [00:34<05:08,  3.93it/s]

neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9659, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9544, grad_fn=<MeanBackward0>)
neg tensor(0.9614, grad_fn=<MeanBackward0>)
pos tensor(0.9546, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9552, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9621, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<Mean

Training:  10%|███████████████▉                                                                                                                                          | 140/1352 [00:34<04:53,  4.13it/s]

neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9637, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9385, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9229, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBack

Training:  10%|████████████████                                                                                                                                          | 141/1352 [00:34<04:54,  4.11it/s]

neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9575, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9608, grad_fn=<MeanBackward0>)
neg tensor(0.9583, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9582, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<Mean

Training:  11%|████████████████▏                                                                                                                                         | 142/1352 [00:35<05:00,  4.03it/s]

neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9634, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9573, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<Mean

Training:  11%|████████████████▎                                                                                                                                         | 143/1352 [00:35<04:48,  4.19it/s]

neg tensor(0.7927, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9580, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9605, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<Mean

Training:  11%|████████████████▍                                                                                                                                         | 144/1352 [00:35<05:06,  3.95it/s]

neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9565, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBack

Training:  11%|████████████████▌                                                                                                                                         | 145/1352 [00:35<04:50,  4.15it/s]

neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9473, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(-0.1016, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<Mea

Training:  11%|████████████████▋                                                                                                                                         | 146/1352 [00:36<04:38,  4.32it/s]

neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9510, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9636, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9569, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<Mean

Training:  11%|████████████████▋                                                                                                                                         | 147/1352 [00:36<04:44,  4.24it/s]

neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9483, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9631, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9612, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<Mean

Training:  11%|████████████████▊                                                                                                                                         | 148/1352 [00:36<04:46,  4.20it/s]

neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9738, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<Mean

Training:  11%|████████████████▉                                                                                                                                         | 149/1352 [00:36<04:43,  4.24it/s]

neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9508, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9468, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<Mean

Training:  11%|█████████████████                                                                                                                                         | 150/1352 [00:37<04:51,  4.13it/s]

neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9628, grad_fn=<MeanBackward0>)
neg tensor(0.5659, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9643, grad_fn=<MeanBackward0>)
neg tensor(0.9562, grad_fn=<MeanBackward0>)
pos tensor(0.9403, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9672, grad_fn=<Mean

Training:  11%|█████████████████▏                                                                                                                                        | 151/1352 [00:37<04:58,  4.02it/s]

neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9636, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<Mean

Training:  11%|█████████████████▎                                                                                                                                        | 152/1352 [00:37<04:59,  4.01it/s]

neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9592, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9591, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<Mean

Training:  11%|█████████████████▍                                                                                                                                        | 153/1352 [00:37<05:15,  3.79it/s]

neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9553, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9575, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<Mean

Training:  11%|█████████████████▌                                                                                                                                        | 154/1352 [00:38<05:39,  3.53it/s]

neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9617, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<Mean

Training:  11%|█████████████████▋                                                                                                                                        | 155/1352 [00:38<05:55,  3.37it/s]

neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9580, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9656, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<Mean

Training:  12%|█████████████████▊                                                                                                                                        | 156/1352 [00:38<05:30,  3.62it/s]

neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9591, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9592, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9462, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<Mean

Training:  12%|█████████████████▉                                                                                                                                        | 157/1352 [00:39<05:04,  3.92it/s]

neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(0.9542, grad_fn=<MeanBackward0>)
neg tensor(0.9407, grad_fn=<MeanBackward0>)
pos tensor(0.9643, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9659, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9555, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<Mean

Training:  12%|█████████████████▉                                                                                                                                        | 158/1352 [00:39<04:34,  4.35it/s]

neg tensor(0.9511, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9368, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9666, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9293, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)


Training:  12%|██████████████████                                                                                                                                        | 159/1352 [00:39<04:35,  4.33it/s]

neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9666, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.4800, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9629, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<Mean

Training:  12%|██████████████████▏                                                                                                                                       | 160/1352 [00:39<04:14,  4.68it/s]

pos tensor(0.9624, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9603, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9634, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)


Training:  12%|██████████████████▎                                                                                                                                       | 161/1352 [00:39<04:33,  4.35it/s]

neg tensor(0.9526, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9629, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9708, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9561, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<Mean

Training:  12%|██████████████████▍                                                                                                                                       | 162/1352 [00:40<04:54,  4.04it/s]

neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<Mean

Training:  12%|██████████████████▌                                                                                                                                       | 163/1352 [00:40<04:55,  4.03it/s]

neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9479, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<Mean

Training:  12%|██████████████████▋                                                                                                                                       | 164/1352 [00:40<04:27,  4.44it/s]

neg tensor(0.9533, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.3131, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.5699, grad_fn=<MeanBackward0>)
pos tensor(0.9612, grad_fn=<MeanBackward0>)
neg tensor(0.9489, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)


Training:  12%|██████████████████▊                                                                                                                                       | 165/1352 [00:40<04:36,  4.29it/s]

neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9601, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<Mean

Training:  12%|██████████████████▉                                                                                                                                       | 166/1352 [00:40<04:15,  4.64it/s]

pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.8495, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9275, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9678, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<Mean

Training:  12%|███████████████████                                                                                                                                       | 167/1352 [00:41<04:14,  4.66it/s]

pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9581, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9709, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9383, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBack

Training:  12%|███████████████████▏                                                                                                                                      | 168/1352 [00:41<04:31,  4.37it/s]

neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9647, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.9113, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<Mean

Training:  12%|███████████████████▎                                                                                                                                      | 169/1352 [00:41<04:34,  4.30it/s]

neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.6925, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9505, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9642, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9657, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<Mean

Training:  13%|███████████████████▎                                                                                                                                      | 170/1352 [00:41<04:36,  4.27it/s]

neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9672, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<Mean

Training:  13%|███████████████████▍                                                                                                                                      | 171/1352 [00:42<04:20,  4.53it/s]

neg tensor(0.9434, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9450, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9570, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBack

Training:  13%|███████████████████▌                                                                                                                                      | 172/1352 [00:42<04:29,  4.38it/s]

neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<Mean

Training:  13%|███████████████████▋                                                                                                                                      | 173/1352 [00:42<04:18,  4.56it/s]

neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<Mean

Training:  13%|███████████████████▊                                                                                                                                      | 174/1352 [00:42<04:50,  4.06it/s]

neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9437, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9642, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<Mean

Training:  13%|███████████████████▉                                                                                                                                      | 175/1352 [00:43<04:41,  4.19it/s]

neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9656, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBack

Training:  13%|████████████████████                                                                                                                                      | 176/1352 [00:43<04:43,  4.14it/s]

neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.7496, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<Mean

Training:  13%|████████████████████▏                                                                                                                                     | 177/1352 [00:43<04:30,  4.35it/s]

neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9567, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<Mean

Training:  13%|████████████████████▎                                                                                                                                     | 178/1352 [00:43<04:50,  4.04it/s]

neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9716, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<Mean

Training:  13%|████████████████████▍                                                                                                                                     | 179/1352 [00:44<04:47,  4.08it/s]

neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9621, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9636, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9586, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.6906, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<Mean

Training:  13%|████████████████████▌                                                                                                                                     | 180/1352 [00:44<04:43,  4.13it/s]

neg tensor(0.9715, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9656, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<Mean

Training:  13%|████████████████████▌                                                                                                                                     | 181/1352 [00:44<04:25,  4.42it/s]

neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9515, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<Mean

Training:  13%|████████████████████▋                                                                                                                                     | 182/1352 [00:44<05:02,  3.87it/s]

neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9493, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<Mean

Training:  14%|████████████████████▊                                                                                                                                     | 183/1352 [00:45<05:08,  3.79it/s]

neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9707, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9554, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<Mean

Training:  14%|████████████████████▉                                                                                                                                     | 184/1352 [00:45<05:01,  3.88it/s]

neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9427, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9610, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9171, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<Mean

Training:  14%|█████████████████████                                                                                                                                     | 185/1352 [00:45<05:12,  3.74it/s]

neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<Mean

Training:  14%|█████████████████████▏                                                                                                                                    | 186/1352 [00:45<05:19,  3.65it/s]

neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9689, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9617, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<Mean

Training:  14%|█████████████████████▎                                                                                                                                    | 187/1352 [00:46<04:53,  3.97it/s]

neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9286, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9620, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.9564, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<Mean

Training:  14%|█████████████████████▍                                                                                                                                    | 188/1352 [00:46<04:55,  3.94it/s]

neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9578, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9623, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9711, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<Mean

Training:  14%|█████████████████████▌                                                                                                                                    | 189/1352 [00:46<04:47,  4.05it/s]

neg tensor(0.8932, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9716, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBack

Training:  14%|█████████████████████▋                                                                                                                                    | 190/1352 [00:46<04:47,  4.04it/s]

neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9074, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9678, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward

Training:  14%|█████████████████████▊                                                                                                                                    | 191/1352 [00:47<04:45,  4.07it/s]

neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9461, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9371, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9506, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<Mean

Training:  14%|█████████████████████▊                                                                                                                                    | 192/1352 [00:47<04:41,  4.13it/s]

neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<Mean

Training:  14%|█████████████████████▉                                                                                                                                    | 193/1352 [00:47<04:37,  4.17it/s]

neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9671, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<Mean

Training:  14%|██████████████████████                                                                                                                                    | 194/1352 [00:47<04:42,  4.09it/s]

neg tensor(0.9553, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9656, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<Mean

Training:  14%|██████████████████████▏                                                                                                                                   | 195/1352 [00:48<04:53,  3.94it/s]

neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9617, grad_fn=<MeanBackward0>)
neg tensor(0.9650, grad_fn=<MeanBackward0>)
pos tensor(0.9403, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9455, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<Mean

Training:  14%|██████████████████████▎                                                                                                                                   | 196/1352 [00:48<05:10,  3.72it/s]

neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<Mean

Training:  15%|██████████████████████▍                                                                                                                                   | 197/1352 [00:48<05:06,  3.76it/s]

neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9582, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBack

Training:  15%|██████████████████████▌                                                                                                                                   | 198/1352 [00:48<05:08,  3.74it/s]

neg tensor(0.9395, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9576, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<Mean

Training:  15%|██████████████████████▋                                                                                                                                   | 199/1352 [00:49<05:13,  3.68it/s]

neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.4383, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<Mean

Training:  15%|██████████████████████▊                                                                                                                                   | 200/1352 [00:49<05:16,  3.64it/s]

neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBack

Training:  15%|██████████████████████▉                                                                                                                                   | 201/1352 [00:49<05:08,  3.73it/s]

neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9623, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<Mean

Training:  15%|███████████████████████                                                                                                                                   | 202/1352 [00:50<05:04,  3.78it/s]

neg tensor(0.9644, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9501, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9738, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<Mean

Training:  15%|███████████████████████                                                                                                                                   | 203/1352 [00:50<04:34,  4.19it/s]

neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9661, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9330, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<Mean

Training:  15%|███████████████████████▏                                                                                                                                  | 204/1352 [00:50<04:38,  4.13it/s]

neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<Mean

Training:  15%|███████████████████████▎                                                                                                                                  | 205/1352 [00:50<04:57,  3.86it/s]

neg tensor(0.9665, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9647, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<Mean

Training:  15%|███████████████████████▍                                                                                                                                  | 206/1352 [00:51<04:57,  3.86it/s]

neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<Mean

Training:  15%|███████████████████████▌                                                                                                                                  | 207/1352 [00:51<04:47,  3.99it/s]

neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9552, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.8720, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9440, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<Mean

Training:  15%|███████████████████████▋                                                                                                                                  | 208/1352 [00:51<04:33,  4.19it/s]

neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9440, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9676, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9442, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9637, grad_fn=<MeanBackward0>)
pos tensor(0.9560, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<Mean

Training:  15%|███████████████████████▊                                                                                                                                  | 209/1352 [00:51<04:38,  4.11it/s]

neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9539, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9626, grad_fn=<MeanBackward0>)
pos tensor(0.9559, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<Mean

Training:  16%|███████████████████████▉                                                                                                                                  | 210/1352 [00:51<04:34,  4.15it/s]

neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.6596, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9616, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9711, grad_fn=<MeanBackward0>)
neg tensor(0.3110, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<Mean

Training:  16%|████████████████████████                                                                                                                                  | 211/1352 [00:52<04:19,  4.39it/s]

neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9716, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<Mean

Training:  16%|████████████████████████▏                                                                                                                                 | 212/1352 [00:52<04:42,  4.03it/s]

neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<Mean

Training:  16%|████████████████████████▎                                                                                                                                 | 213/1352 [00:52<04:28,  4.24it/s]

neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9663, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9338, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9301, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<Mean

Training:  16%|████████████████████████▍                                                                                                                                 | 214/1352 [00:52<04:52,  3.90it/s]

neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9606, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.8007, grad_fn=<Mean

Training:  16%|████████████████████████▍                                                                                                                                 | 215/1352 [00:53<04:45,  3.98it/s]

neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.8031, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9373, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9245, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<Mean

Training:  16%|████████████████████████▌                                                                                                                                 | 216/1352 [00:53<04:46,  3.96it/s]

neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9515, grad_fn=<MeanBackward0>)
neg tensor(0.9616, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9637, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.8256, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBack

Training:  16%|████████████████████████▋                                                                                                                                 | 217/1352 [00:53<04:44,  3.99it/s]

neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9545, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<Mean

Training:  16%|████████████████████████▊                                                                                                                                 | 218/1352 [00:53<04:33,  4.15it/s]

neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9693, grad_fn=<MeanBackward0>)
pos tensor(0.9958, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9671, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.8397, grad_fn=<MeanBackward0>)
pos tensor(0.9572, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.6413, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBack

Training:  16%|████████████████████████▉                                                                                                                                 | 219/1352 [00:54<04:15,  4.43it/s]

neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9614, grad_fn=<MeanBackward0>)
pos tensor(0.9458, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)


Training:  16%|█████████████████████████                                                                                                                                 | 220/1352 [00:54<04:16,  4.40it/s]

neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9612, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9089, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9269, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<Mean

Training:  16%|█████████████████████████▏                                                                                                                                | 221/1352 [00:54<04:26,  4.24it/s]

neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9397, grad_fn=<MeanBackward0>)
pos tensor(0.9623, grad_fn=<MeanBackward0>)
neg tensor(-0.4348, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<Mea

Training:  16%|█████████████████████████▎                                                                                                                                | 222/1352 [00:54<04:42,  4.01it/s]

neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9407, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9511, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9722, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9556, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<Mean

Training:  16%|█████████████████████████▍                                                                                                                                | 223/1352 [00:55<04:44,  3.96it/s]

neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9007, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9553, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<Mean

Training:  17%|█████████████████████████▌                                                                                                                                | 224/1352 [00:55<04:36,  4.07it/s]

neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9322, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<Mean

Training:  17%|█████████████████████████▋                                                                                                                                | 225/1352 [00:55<04:30,  4.17it/s]

neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<Mean

Training:  17%|█████████████████████████▋                                                                                                                                | 226/1352 [00:55<04:31,  4.14it/s]

neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9550, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9586, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<Mean

Training:  17%|█████████████████████████▊                                                                                                                                | 227/1352 [00:56<04:33,  4.11it/s]

neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.7231, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9544, grad_fn=<MeanBackward0>)
neg tensor(0.9422, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<Mean

Training:  17%|█████████████████████████▉                                                                                                                                | 228/1352 [00:56<04:35,  4.08it/s]

neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9294, grad_fn=<MeanBackward0>)
neg tensor(0.7408, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<Mean

Training:  17%|██████████████████████████                                                                                                                                | 229/1352 [00:56<04:27,  4.20it/s]

neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9711, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9613, grad_fn=<MeanBackward0>)
pos tensor(0.9379, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<Mean

Training:  17%|██████████████████████████▏                                                                                                                               | 230/1352 [00:56<04:44,  3.94it/s]

neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.8282, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9648, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<Mean

Training:  17%|██████████████████████████▎                                                                                                                               | 231/1352 [00:57<04:52,  3.83it/s]

neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.8990, grad_fn=<Mean

Training:  17%|██████████████████████████▍                                                                                                                               | 232/1352 [00:57<04:40,  4.00it/s]

neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9560, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<Mean

Training:  17%|██████████████████████████▌                                                                                                                               | 233/1352 [00:57<04:45,  3.92it/s]

neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9388, grad_fn=<MeanBackward0>)
neg tensor(0.9402, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<Mean

Training:  17%|██████████████████████████▋                                                                                                                               | 234/1352 [00:57<04:36,  4.04it/s]

neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9634, grad_fn=<MeanBackward0>)
neg tensor(0.9389, grad_fn=<Mean

Training:  17%|██████████████████████████▊                                                                                                                               | 235/1352 [00:58<04:19,  4.30it/s]

neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9738, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<Mean

Training:  17%|██████████████████████████▉                                                                                                                               | 236/1352 [00:58<04:25,  4.21it/s]

neg tensor(0.9631, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<Mean

Training:  18%|██████████████████████████▉                                                                                                                               | 237/1352 [00:58<04:08,  4.49it/s]

neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<Mean

Training:  18%|███████████████████████████                                                                                                                               | 238/1352 [00:58<04:08,  4.49it/s]

neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.7382, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<Mean

Training:  18%|███████████████████████████▏                                                                                                                              | 239/1352 [00:58<04:12,  4.40it/s]

neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9369, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.8831, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(-0.0152, grad_fn=<MeanBac

Training:  18%|███████████████████████████▎                                                                                                                              | 240/1352 [00:59<04:08,  4.48it/s]

neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9659, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBack

Training:  18%|███████████████████████████▍                                                                                                                              | 241/1352 [00:59<04:14,  4.37it/s]

neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<Mean

Training:  18%|███████████████████████████▌                                                                                                                              | 242/1352 [00:59<04:06,  4.50it/s]

neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<Mean

Training:  18%|███████████████████████████▋                                                                                                                              | 243/1352 [00:59<04:35,  4.02it/s]

neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<Mean

Training:  18%|███████████████████████████▊                                                                                                                              | 244/1352 [01:00<04:28,  4.13it/s]

neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9519, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<Mean

Training:  18%|███████████████████████████▉                                                                                                                              | 245/1352 [01:00<04:22,  4.22it/s]

neg tensor(0.9307, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9674, grad_fn=<MeanBackward0>)
neg tensor(0.9548, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9535, grad_fn=<MeanBackward0>)
pos tensor(0.9721, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9658, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBack

Training:  18%|████████████████████████████                                                                                                                              | 246/1352 [01:00<04:31,  4.08it/s]

neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.8630, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.7235, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<Mean

Training:  18%|████████████████████████████▏                                                                                                                             | 247/1352 [01:00<04:18,  4.27it/s]

neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9615, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9715, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<Mean

Training:  18%|████████████████████████████▏                                                                                                                             | 248/1352 [01:01<04:18,  4.27it/s]

neg tensor(0.8072, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9394, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.3583, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<Mean

Training:  18%|████████████████████████████▎                                                                                                                             | 249/1352 [01:01<04:12,  4.38it/s]

neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9549, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<Mean

Training:  18%|████████████████████████████▍                                                                                                                             | 250/1352 [01:01<04:09,  4.41it/s]

neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9193, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9643, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<Mean

Training:  19%|████████████████████████████▌                                                                                                                             | 251/1352 [01:01<04:05,  4.49it/s]

neg tensor(0.8974, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9528, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9689, grad_fn=<MeanBackward0>)
pos tensor(0.9560, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9575, grad_fn=<MeanBackward0>)
pos tensor(0.9339, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBack

Training:  19%|████████████████████████████▋                                                                                                                             | 252/1352 [01:01<03:53,  4.70it/s]

neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9628, grad_fn=<MeanBackward0>)
neg tensor(0.9601, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)


Training:  19%|████████████████████████████▊                                                                                                                             | 253/1352 [01:02<04:03,  4.50it/s]

neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9666, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9662, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9299, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.7671, grad_fn=<Mean

Training:  19%|████████████████████████████▉                                                                                                                             | 254/1352 [01:02<04:09,  4.41it/s]

neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9642, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9661, grad_fn=<MeanBackward0>)
neg tensor(0.9672, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9690, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBack

Training:  19%|█████████████████████████████                                                                                                                             | 255/1352 [01:02<04:15,  4.30it/s]

neg tensor(0.8411, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9588, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9517, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.8194, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<Mean

Training:  19%|█████████████████████████████▏                                                                                                                            | 256/1352 [01:02<04:12,  4.34it/s]

neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9543, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9583, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<Mean

Training:  19%|█████████████████████████████▎                                                                                                                            | 257/1352 [01:03<04:09,  4.38it/s]

neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.8607, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBack

Training:  19%|█████████████████████████████▍                                                                                                                            | 258/1352 [01:03<04:08,  4.40it/s]

neg tensor(0.9662, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9600, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9253, grad_fn=<MeanBackward0>)
pos tensor(0.9550, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9521, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBack

Training:  19%|█████████████████████████████▌                                                                                                                            | 259/1352 [01:03<04:12,  4.32it/s]

neg tensor(0.4820, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9656, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9665, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9613, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<Mean

Training:  19%|█████████████████████████████▌                                                                                                                            | 260/1352 [01:03<04:20,  4.19it/s]

neg tensor(0.9523, grad_fn=<MeanBackward0>)
pos tensor(0.9461, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9500, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9434, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<Mean

Training:  19%|█████████████████████████████▋                                                                                                                            | 261/1352 [01:04<04:08,  4.39it/s]

neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9493, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<Mean

Training:  19%|█████████████████████████████▊                                                                                                                            | 262/1352 [01:04<04:13,  4.30it/s]

neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9690, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.6186, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<Mean

Training:  19%|█████████████████████████████▉                                                                                                                            | 263/1352 [01:04<04:25,  4.10it/s]

neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9678, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.8355, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<Mean

Training:  20%|██████████████████████████████                                                                                                                            | 264/1352 [01:04<04:31,  4.01it/s]

neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.8988, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9484, grad_fn=<MeanBackward0>)
pos tensor(0.9596, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9607, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9657, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<Mean

Training:  20%|██████████████████████████████▏                                                                                                                           | 265/1352 [01:04<04:14,  4.28it/s]

neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9707, grad_fn=<MeanBackward0>)
neg tensor(0.9508, grad_fn=<Mean

Training:  20%|██████████████████████████████▎                                                                                                                           | 266/1352 [01:05<04:24,  4.10it/s]

neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9640, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9402, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBack

Training:  20%|██████████████████████████████▍                                                                                                                           | 267/1352 [01:05<04:20,  4.17it/s]

neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9597, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9497, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9435, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9528, grad_fn=<MeanBackward0>)
pos tensor(0.9389, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9660, grad_fn=<MeanBackward0>)
neg tensor(0.8057, grad_fn=<MeanBackward0>)
pos tensor(0.9529, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<Mean

Training:  20%|██████████████████████████████▌                                                                                                                           | 268/1352 [01:05<04:08,  4.37it/s]

neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.4826, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.8981, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9593, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<Mean

Training:  20%|██████████████████████████████▋                                                                                                                           | 269/1352 [01:05<04:04,  4.42it/s]

neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.7324, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9498, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9612, grad_fn=<Mean

Training:  20%|██████████████████████████████▊                                                                                                                           | 270/1352 [01:06<04:26,  4.06it/s]

neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9689, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9529, grad_fn=<MeanBackward0>)
pos tensor(0.9293, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<Mean

Training:  20%|██████████████████████████████▊                                                                                                                           | 271/1352 [01:06<05:04,  3.55it/s]

neg tensor(0.9587, grad_fn=<MeanBackward0>)
pos tensor(0.9595, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<Mean

Training:  20%|██████████████████████████████▉                                                                                                                           | 272/1352 [01:06<04:55,  3.66it/s]

neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9662, grad_fn=<MeanBackward0>)
pos tensor(0.9571, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9692, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9171, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<Mean

Training:  20%|███████████████████████████████                                                                                                                           | 273/1352 [01:07<04:52,  3.68it/s]

neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9526, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<Mean

Training:  20%|███████████████████████████████▏                                                                                                                          | 274/1352 [01:07<04:53,  3.67it/s]

neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9714, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9718, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.5770, grad_fn=<MeanBackward0>)
pos tensor(0.9583, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<Mean

Training:  20%|███████████████████████████████▎                                                                                                                          | 275/1352 [01:07<04:32,  3.96it/s]

neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9949, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9413, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBack

Training:  20%|███████████████████████████████▍                                                                                                                          | 276/1352 [01:07<04:30,  3.97it/s]

neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9575, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.5909, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<Mean

Training:  20%|███████████████████████████████▌                                                                                                                          | 277/1352 [01:08<04:19,  4.14it/s]

neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9733, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBack

Training:  21%|███████████████████████████████▋                                                                                                                          | 278/1352 [01:08<04:33,  3.92it/s]

neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9609, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBack

Training:  21%|███████████████████████████████▊                                                                                                                          | 279/1352 [01:08<04:18,  4.15it/s]

neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.5735, grad_fn=<MeanBackward0>)
pos tensor(0.9570, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8892, grad_fn=<MeanBackward0>)
pos tensor(0.9038, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<Mean

Training:  21%|███████████████████████████████▉                                                                                                                          | 280/1352 [01:08<04:09,  4.30it/s]

neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9473, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.7853, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9402, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(-0.0098, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<Mea

Training:  21%|████████████████████████████████                                                                                                                          | 281/1352 [01:08<04:10,  4.28it/s]

neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9260, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9617, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.7948, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<Mean

Training:  21%|████████████████████████████████                                                                                                                          | 282/1352 [01:09<04:00,  4.45it/s]

neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9486, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9533, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<Mean

Training:  21%|████████████████████████████████▎                                                                                                                         | 284/1352 [01:09<03:25,  5.20it/s]

neg tensor(0.9279, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9436, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9617, grad_fn=<MeanBackward0>)
neg tensor(0.9541, grad_fn=<MeanBackward0>)
pos tensor(0.9466, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<Mean

Training:  21%|████████████████████████████████▍                                                                                                                         | 285/1352 [01:09<03:31,  5.05it/s]

tensor(0.8543, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9594, grad_fn=<MeanBackward0>)
pos tensor(0.9485, grad_fn=<MeanBackward0>)
neg tensor(0.8359, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward

Training:  21%|████████████████████████████████▌                                                                                                                         | 286/1352 [01:09<03:38,  4.87it/s]

neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.8746, grad_fn=<MeanBackward0>)
pos tensor(0.8581, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9649, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9072, grad_fn=<MeanBackward0>)
pos tensor(0.9594, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9634, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9569, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBack

Training:  21%|████████████████████████████████▋                                                                                                                         | 287/1352 [01:10<03:54,  4.54it/s]

neg tensor(0.9521, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9643, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9683, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9483, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9659, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<Mean

Training:  21%|████████████████████████████████▊                                                                                                                         | 288/1352 [01:10<03:53,  4.57it/s]

neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9569, grad_fn=<MeanBackward0>)
neg tensor(0.9596, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9635, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9625, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9458, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9516, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9456, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9480, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9610, grad_fn=<Mean

Training:  21%|████████████████████████████████▉                                                                                                                         | 289/1352 [01:10<03:59,  4.44it/s]

neg tensor(0.8937, grad_fn=<MeanBackward0>)
pos tensor(0.9484, grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9514, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9577, grad_fn=<MeanBackward0>)
neg tensor(0.8145, grad_fn=<MeanBackward0>)
pos tensor(0.9006, grad_fn=<MeanBackward0>)
neg tensor(0.9707, grad_fn=<MeanBackward0>)
pos tensor(0.9514, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(0.9613, grad_fn=<MeanBackward0>)
neg tensor(0.9592, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9490, grad_fn=<MeanBackward0>)
pos tensor(0.9118, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<Mean

Training:  21%|█████████████████████████████████                                                                                                                         | 290/1352 [01:10<04:08,  4.27it/s]

neg tensor(0.9534, grad_fn=<MeanBackward0>)
pos tensor(0.9629, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9724, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9635, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9417, grad_fn=<MeanBackward0>)
neg tensor(0.9300, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<Mean

Training:  22%|█████████████████████████████████▏                                                                                                                        | 291/1352 [01:11<04:03,  4.36it/s]

neg tensor(0.9651, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9018, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9482, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9176, grad_fn=<MeanBackward0>)
pos tensor(0.9442, grad_fn=<MeanBackward0>)
neg tensor(0.9504, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.8298, grad_fn=<MeanBack

Training:  22%|█████████████████████████████████▎                                                                                                                        | 292/1352 [01:11<04:00,  4.40it/s]

neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9636, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBack

Training:  22%|█████████████████████████████████▎                                                                                                                        | 293/1352 [01:11<03:48,  4.64it/s]

neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9495, grad_fn=<MeanBackward0>)
pos tensor(0.9454, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9643, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)


Training:  22%|█████████████████████████████████▍                                                                                                                        | 294/1352 [01:11<03:58,  4.44it/s]

neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9164, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9626, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9315, grad_fn=<Mean

Training:  22%|█████████████████████████████████▌                                                                                                                        | 295/1352 [01:11<04:00,  4.40it/s]

neg tensor(0.9710, grad_fn=<MeanBackward0>)
pos tensor(0.9695, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9600, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.8990, grad_fn=<MeanBackward0>)
pos tensor(0.9066, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9534, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9651, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<Mean

Training:  22%|█████████████████████████████████▋                                                                                                                        | 296/1352 [01:12<04:19,  4.08it/s]

neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.8593, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9435, grad_fn=<MeanBackward0>)
pos tensor(0.9500, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<Mean

Training:  22%|█████████████████████████████████▊                                                                                                                        | 297/1352 [01:12<04:11,  4.19it/s]

neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9631, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9318, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9528, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.8774, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<Mean

Training:  22%|█████████████████████████████████▉                                                                                                                        | 298/1352 [01:12<04:19,  4.07it/s]

neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9345, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<Mean

Training:  22%|██████████████████████████████████                                                                                                                        | 299/1352 [01:12<04:03,  4.32it/s]

neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.4754, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.8829, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9456, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.8405, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackwar

Training:  22%|██████████████████████████████████▏                                                                                                                       | 300/1352 [01:13<03:51,  4.54it/s]

neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9701, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9624, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9559, grad_fn=<MeanBackward0>)
pos tensor(0.9539, grad_fn=<MeanBackward0>)
neg tensor(0.9509, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9680, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)


Training:  22%|██████████████████████████████████▎                                                                                                                       | 301/1352 [01:13<03:49,  4.58it/s]

neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.8041, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9443, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<Mean

Training:  22%|██████████████████████████████████▍                                                                                                                       | 302/1352 [01:13<03:38,  4.80it/s]

neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9303, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg 

Training:  22%|██████████████████████████████████▌                                                                                                                       | 303/1352 [01:13<03:41,  4.73it/s]

tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9685, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBack

Training:  22%|██████████████████████████████████▋                                                                                                                       | 304/1352 [01:14<03:46,  4.63it/s]

neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9377, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9502, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9427, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9155, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<Mean

Training:  23%|██████████████████████████████████▋                                                                                                                       | 305/1352 [01:14<04:07,  4.23it/s]

neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9782, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<Mean

Training:  23%|██████████████████████████████████▊                                                                                                                       | 306/1352 [01:14<04:21,  4.00it/s]

neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.8004, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9735, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<Mean

Training:  23%|██████████████████████████████████▉                                                                                                                       | 307/1352 [01:14<04:23,  3.96it/s]

neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9654, grad_fn=<MeanBackward0>)
pos tensor(0.9474, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9543, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9570, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.7351, grad_fn=<MeanBackward0>)
pos tensor(0.6238, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9780, grad_fn=<MeanBackward0>)
neg tensor(0.9701, grad_fn=<Mean

Training:  23%|███████████████████████████████████                                                                                                                       | 308/1352 [01:15<04:17,  4.06it/s]

neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.5822, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9136, grad_fn=<MeanBackward0>)
pos tensor(0.9333, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.8524, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9607, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBack

Training:  23%|███████████████████████████████████▏                                                                                                                      | 309/1352 [01:15<04:23,  3.96it/s]

neg tensor(0.8413, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.8751, grad_fn=<MeanBackward0>)
pos tensor(0.9682, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.8824, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9552, grad_fn=<MeanBackward0>)
neg tensor(0.9640, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBack

Training:  23%|███████████████████████████████████▎                                                                                                                      | 310/1352 [01:15<04:44,  3.66it/s]

neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<Mean

Training:  23%|███████████████████████████████████▍                                                                                                                      | 311/1352 [01:15<04:59,  3.48it/s]

neg tensor(0.9625, grad_fn=<MeanBackward0>)
pos tensor(0.9337, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9373, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.8311, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.7531, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<Mean

Training:  23%|███████████████████████████████████▌                                                                                                                      | 312/1352 [01:16<04:43,  3.67it/s]

neg tensor(0.9709, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.8337, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.8022, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9438, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward

Training:  23%|███████████████████████████████████▋                                                                                                                      | 313/1352 [01:16<04:37,  3.75it/s]

neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9614, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9504, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<Mean

Training:  23%|███████████████████████████████████▊                                                                                                                      | 314/1352 [01:16<04:45,  3.64it/s]

neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<Mean

Training:  23%|███████████████████████████████████▉                                                                                                                      | 315/1352 [01:17<05:03,  3.42it/s]

neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9502, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<Mean

Training:  23%|███████████████████████████████████▉                                                                                                                      | 316/1352 [01:17<04:51,  3.55it/s]

neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.8211, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<Mean

Training:  23%|████████████████████████████████████                                                                                                                      | 317/1352 [01:17<04:42,  3.67it/s]

neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9947, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<Mean

Training:  24%|████████████████████████████████████▏                                                                                                                     | 318/1352 [01:17<04:27,  3.87it/s]

neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9625, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.8831, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<Mean

Training:  24%|████████████████████████████████████▎                                                                                                                     | 319/1352 [01:18<04:20,  3.97it/s]

neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.8722, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBack

Training:  24%|████████████████████████████████████▍                                                                                                                     | 320/1352 [01:18<04:02,  4.26it/s]

neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9039, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9376, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.7031, grad_fn=<MeanBack

Training:  24%|████████████████████████████████████▌                                                                                                                     | 321/1352 [01:18<03:55,  4.38it/s]

neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9062, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<Mean

Training:  24%|████████████████████████████████████▋                                                                                                                     | 322/1352 [01:18<03:55,  4.38it/s]

neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9442, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9438, grad_fn=<MeanBackward0>)
pos tensor(0.9617, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.6904, grad_fn=<Mean

Training:  24%|████████████████████████████████████▊                                                                                                                     | 323/1352 [01:18<03:55,  4.37it/s]

neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9223, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9480, grad_fn=<MeanBackward0>)
pos tensor(0.9612, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<Mean

Training:  24%|████████████████████████████████████▉                                                                                                                     | 324/1352 [01:19<03:51,  4.45it/s]

neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.6130, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9396, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<Mean

Training:  24%|█████████████████████████████████████                                                                                                                     | 325/1352 [01:19<03:59,  4.29it/s]

neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9601, grad_fn=<MeanBackward0>)
pos tensor(0.9565, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<Mean

Training:  24%|█████████████████████████████████████▏                                                                                                                    | 326/1352 [01:19<04:11,  4.09it/s]

neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9496, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9690, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.4788, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9403, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<Mean

Training:  24%|█████████████████████████████████████▏                                                                                                                    | 327/1352 [01:19<04:08,  4.13it/s]

neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9548, grad_fn=<MeanBackward0>)
pos tensor(0.9545, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9183, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<Mean

Training:  24%|█████████████████████████████████████▎                                                                                                                    | 328/1352 [01:20<04:12,  4.05it/s]

neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9387, grad_fn=<MeanBackward0>)
pos tensor(0.9451, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9337, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9309, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBack

Training:  24%|█████████████████████████████████████▍                                                                                                                    | 329/1352 [01:20<04:01,  4.24it/s]

neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9542, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<Mean

Training:  24%|█████████████████████████████████████▌                                                                                                                    | 330/1352 [01:20<03:55,  4.34it/s]

neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.5289, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9638, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9753, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBack

Training:  24%|█████████████████████████████████████▋                                                                                                                    | 331/1352 [01:20<03:52,  4.40it/s]

neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9328, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<Mean

Training:  25%|█████████████████████████████████████▊                                                                                                                    | 332/1352 [01:21<03:42,  4.58it/s]

neg tensor(0.8126, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9018, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9666, grad_fn=<MeanBackward0>)
pos tensor(0.9579, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<Mean

Training:  25%|█████████████████████████████████████▉                                                                                                                    | 333/1352 [01:21<03:44,  4.54it/s]

neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9711, grad_fn=<MeanBackward0>)
neg tensor(0.9498, grad_fn=<MeanBackward0>)
pos tensor(0.9589, grad_fn=<MeanBackward0>)
neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9449, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9558, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<Mean

Training:  25%|██████████████████████████████████████                                                                                                                    | 334/1352 [01:21<03:49,  4.44it/s]

neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9747, grad_fn=<MeanBackward0>)
neg tensor(0.9618, grad_fn=<MeanBackward0>)
pos tensor(0.9224, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.8985, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.7170, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9230, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9622, grad_fn=<Mean

Training:  25%|██████████████████████████████████████▏                                                                                                                   | 335/1352 [01:21<03:48,  4.44it/s]

neg tensor(0.9604, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9644, grad_fn=<MeanBackward0>)
neg tensor(0.9409, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9592, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9458, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<Mean

Training:  25%|██████████████████████████████████████▎                                                                                                                   | 336/1352 [01:21<03:57,  4.27it/s]

neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9575, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9758, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9646, grad_fn=<MeanBackward0>)
neg tensor(0.9669, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9755, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBack

Training:  25%|██████████████████████████████████████▍                                                                                                                   | 337/1352 [01:22<04:15,  3.97it/s]

neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.8253, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9596, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9614, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9569, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<Mean

Training:  25%|██████████████████████████████████████▌                                                                                                                   | 338/1352 [01:22<04:28,  3.77it/s]

neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9563, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9494, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9560, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9750, grad_fn=<MeanBackward0>)
pos tensor(0.9550, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<Mean

Training:  25%|██████████████████████████████████████▌                                                                                                                   | 339/1352 [01:22<04:38,  3.64it/s]

neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9427, grad_fn=<MeanBackward0>)
pos tensor(0.9315, grad_fn=<MeanBackward0>)
neg tensor(0.9552, grad_fn=<MeanBackward0>)
pos tensor(0.9645, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9619, grad_fn=<MeanBackward0>)
neg tensor(0.8899, grad_fn=<MeanBackward0>)
pos tensor(0.9371, grad_fn=<MeanBackward0>)
neg tensor(0.9654, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9174, grad_fn=<MeanBackward0>)
pos tensor(0.9693, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBack

Training:  25%|██████████████████████████████████████▋                                                                                                                   | 340/1352 [01:23<04:27,  3.79it/s]

neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.2981, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.8525, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9532, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<Mean

Training:  25%|██████████████████████████████████████▊                                                                                                                   | 341/1352 [01:23<04:16,  3.94it/s]

neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9582, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9629, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9284, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.8904, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9547, grad_fn=<Mean

Training:  25%|██████████████████████████████████████▉                                                                                                                   | 342/1352 [01:23<04:16,  3.94it/s]

neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9740, grad_fn=<MeanBackward0>)
pos tensor(0.9690, grad_fn=<MeanBackward0>)
neg tensor(0.7594, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9102, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.8300, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<Mean

Training:  25%|███████████████████████████████████████                                                                                                                   | 343/1352 [01:23<04:10,  4.02it/s]

neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.8641, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9424, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9673, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9689, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9298, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9759, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<Mean

Training:  25%|███████████████████████████████████████▏                                                                                                                  | 344/1352 [01:24<04:09,  4.03it/s]

neg tensor(0.8237, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.7531, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9609, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9418, grad_fn=<Mean

Training:  26%|███████████████████████████████████████▎                                                                                                                  | 345/1352 [01:24<04:11,  4.00it/s]

neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9552, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9255, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9514, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9301, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBack

Training:  26%|███████████████████████████████████████▍                                                                                                                  | 346/1352 [01:24<04:15,  3.94it/s]

neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.8919, grad_fn=<MeanBackward0>)
pos tensor(0.9579, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9651, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9692, grad_fn=<MeanBackward0>)
pos tensor(0.9467, grad_fn=<MeanBackward0>)
neg tensor(0.9472, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9462, grad_fn=<Mean

Training:  26%|███████████████████████████████████████▌                                                                                                                  | 347/1352 [01:24<04:09,  4.03it/s]

neg tensor(0.4822, grad_fn=<MeanBackward0>)
pos tensor(0.9639, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9704, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9615, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<Mean

Training:  26%|███████████████████████████████████████▋                                                                                                                  | 348/1352 [01:25<04:15,  3.93it/s]

neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9637, grad_fn=<MeanBackward0>)
neg tensor(0.7431, grad_fn=<MeanBackward0>)
pos tensor(0.9624, grad_fn=<MeanBackward0>)
neg tensor(0.8771, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<Mean

Training:  26%|███████████████████████████████████████▊                                                                                                                  | 349/1352 [01:25<04:07,  4.05it/s]

neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9370, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.8619, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.3831, grad_fn=<MeanBack

Training:  26%|███████████████████████████████████████▊                                                                                                                  | 350/1352 [01:25<04:16,  3.91it/s]

neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9415, grad_fn=<MeanBackward0>)
pos tensor(0.9555, grad_fn=<MeanBackward0>)
neg tensor(0.9720, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<Mean

Training:  26%|███████████████████████████████████████▉                                                                                                                  | 351/1352 [01:25<04:14,  3.93it/s]

neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9581, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<Mean

Training:  26%|████████████████████████████████████████                                                                                                                  | 352/1352 [01:26<04:11,  3.97it/s]

neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.8294, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9529, grad_fn=<Mean

Training:  26%|████████████████████████████████████████▏                                                                                                                 | 353/1352 [01:26<04:02,  4.12it/s]

neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9017, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.7972, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<Mean

Training:  26%|████████████████████████████████████████▎                                                                                                                 | 354/1352 [01:26<04:04,  4.08it/s]

neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.8011, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<Mean

Training:  26%|████████████████████████████████████████▍                                                                                                                 | 355/1352 [01:26<03:50,  4.33it/s]

neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9579, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9563, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<Mean

Training:  26%|████████████████████████████████████████▌                                                                                                                 | 356/1352 [01:26<03:57,  4.19it/s]

neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9597, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9650, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.8418, grad_fn=<Mean

Training:  26%|████████████████████████████████████████▋                                                                                                                 | 357/1352 [01:27<03:59,  4.16it/s]

neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9629, grad_fn=<MeanBackward0>)
pos tensor(0.9390, grad_fn=<MeanBackward0>)
neg tensor(0.9313, grad_fn=<MeanBackward0>)
pos tensor(0.9113, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<Mean

Training:  26%|████████████████████████████████████████▊                                                                                                                 | 358/1352 [01:27<04:08,  4.00it/s]

neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.7662, grad_fn=<MeanBackward0>)
pos tensor(0.9679, grad_fn=<MeanBackward0>)
neg tensor(0.9138, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<Mean

Training:  27%|████████████████████████████████████████▉                                                                                                                 | 359/1352 [01:27<04:03,  4.08it/s]

neg tensor(0.7019, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9952, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9416, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████                                                                                                                 | 360/1352 [01:28<04:08,  3.99it/s]

neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9553, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9709, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████                                                                                                                 | 361/1352 [01:28<04:09,  3.98it/s]

neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▏                                                                                                                | 362/1352 [01:28<04:09,  3.97it/s]

neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▎                                                                                                                | 363/1352 [01:28<03:56,  4.18it/s]

neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▍                                                                                                                | 364/1352 [01:28<03:59,  4.12it/s]

neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.6299, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▌                                                                                                                | 365/1352 [01:29<03:57,  4.16it/s]

neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▋                                                                                                                | 366/1352 [01:29<03:55,  4.19it/s]

neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▊                                                                                                                | 367/1352 [01:29<03:53,  4.22it/s]

neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<Mean

Training:  27%|█████████████████████████████████████████▉                                                                                                                | 368/1352 [01:29<04:15,  3.86it/s]

neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9344, grad_fn=<MeanBackward0>)
pos tensor(0.9956, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9974, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<Mean

Training:  27%|██████████████████████████████████████████                                                                                                                | 369/1352 [01:30<04:11,  3.91it/s]

neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<Mean

Training:  27%|██████████████████████████████████████████▏                                                                                                               | 370/1352 [01:30<04:24,  3.72it/s]

neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBac

Training:  27%|██████████████████████████████████████████▎                                                                                                               | 371/1352 [01:30<04:28,  3.65it/s]

neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<Mean

Training:  28%|██████████████████████████████████████████▎                                                                                                               | 372/1352 [01:31<04:28,  3.65it/s]

neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<Mean

Training:  28%|██████████████████████████████████████████▍                                                                                                               | 373/1352 [01:31<04:22,  3.73it/s]

neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.6298, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<Mean

Training:  28%|██████████████████████████████████████████▌                                                                                                               | 374/1352 [01:31<04:09,  3.93it/s]

neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.8384, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<Mean

Training:  28%|██████████████████████████████████████████▋                                                                                                               | 375/1352 [01:31<03:59,  4.09it/s]

neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9959, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<Mean

Training:  28%|██████████████████████████████████████████▊                                                                                                               | 376/1352 [01:32<04:03,  4.00it/s]

neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9149, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.8659, grad_fn=<Mean

Training:  28%|██████████████████████████████████████████▉                                                                                                               | 377/1352 [01:32<04:20,  3.75it/s]

neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(-0.0101, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9639, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<Mea

Training:  28%|███████████████████████████████████████████                                                                                                               | 378/1352 [01:32<04:16,  3.80it/s]

neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBack

Training:  28%|███████████████████████████████████████████▏                                                                                                              | 379/1352 [01:32<03:55,  4.14it/s]

neg tensor(0.7170, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(-0.1494, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.7930, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.8971, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<Mea

Training:  28%|███████████████████████████████████████████▎                                                                                                              | 380/1352 [01:33<04:07,  3.92it/s]

neg tensor(0.7681, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9738, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward

Training:  28%|███████████████████████████████████████████▍                                                                                                              | 381/1352 [01:33<04:12,  3.85it/s]

neg tensor(0.7660, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<Mean

Training:  28%|███████████████████████████████████████████▌                                                                                                              | 382/1352 [01:33<04:10,  3.87it/s]

neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9604, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<Mean

Training:  28%|███████████████████████████████████████████▋                                                                                                              | 383/1352 [01:33<04:00,  4.03it/s]

neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9764, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.8919, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9282, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<Mean

Training:  28%|███████████████████████████████████████████▋                                                                                                              | 384/1352 [01:34<04:09,  3.87it/s]

neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.8919, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9531, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9471, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9652, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<Mean

Training:  28%|███████████████████████████████████████████▊                                                                                                              | 385/1352 [01:34<03:56,  4.09it/s]

neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9175, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9704, grad_fn=<MeanBackward0>)
pos tensor(0.9613, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.8597, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9335, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9577, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<Mean

Training:  29%|███████████████████████████████████████████▉                                                                                                              | 386/1352 [01:34<04:01,  4.00it/s]

neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████                                                                                                              | 387/1352 [01:34<04:03,  3.97it/s]

neg tensor(0.9573, grad_fn=<MeanBackward0>)
pos tensor(0.9283, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9775, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.7268, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████▏                                                                                                             | 388/1352 [01:35<03:53,  4.13it/s]

neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9546, grad_fn=<MeanBackward0>)
neg tensor(0.5897, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.5919, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.8101, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████▎                                                                                                             | 389/1352 [01:35<03:39,  4.40it/s]

neg tensor(-0.3480, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9386, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<Mea

Training:  29%|████████████████████████████████████████████▍                                                                                                             | 390/1352 [01:35<03:45,  4.27it/s]

neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.6264, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(0.9541, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9464, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9761, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.5932, grad_fn=<MeanBackward0>)
pos tensor(0.9686, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████▌                                                                                                             | 391/1352 [01:35<03:42,  4.33it/s]

neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9623, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9270, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9617, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9684, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████▋                                                                                                             | 392/1352 [01:35<03:38,  4.39it/s]

neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████▊                                                                                                             | 393/1352 [01:36<03:40,  4.35it/s]

neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9628, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9143, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBack

Training:  29%|████████████████████████████████████████████▉                                                                                                             | 394/1352 [01:36<03:53,  4.11it/s]

neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9640, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.1201, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<Mean

Training:  29%|████████████████████████████████████████████▉                                                                                                             | 395/1352 [01:36<03:48,  4.20it/s]

neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.8163, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9431, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBac

Training:  29%|█████████████████████████████████████████████                                                                                                             | 396/1352 [01:36<03:49,  4.16it/s]

neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9682, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.8784, grad_fn=<MeanBackward0>)
pos tensor(0.8901, grad_fn=<MeanBackward0>)
neg tensor(0.9005, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<Mean

Training:  29%|█████████████████████████████████████████████▏                                                                                                            | 397/1352 [01:37<04:05,  3.89it/s]

neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBack

Training:  29%|█████████████████████████████████████████████▎                                                                                                            | 398/1352 [01:37<03:58,  4.00it/s]

neg tensor(0.9732, grad_fn=<MeanBackward0>)
pos tensor(0.9769, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9610, grad_fn=<Mean

Training:  30%|█████████████████████████████████████████████▍                                                                                                            | 399/1352 [01:37<04:06,  3.87it/s]

neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9788, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<Mean

Training:  30%|█████████████████████████████████████████████▌                                                                                                            | 400/1352 [01:38<04:08,  3.83it/s]

neg tensor(0.8995, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.4213, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.8154, grad_fn=<Mean

Training:  30%|█████████████████████████████████████████████▋                                                                                                            | 401/1352 [01:38<04:05,  3.88it/s]

neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<Mean

Training:  30%|█████████████████████████████████████████████▊                                                                                                            | 402/1352 [01:38<03:50,  4.13it/s]

neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9959, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<Mean

Training:  30%|█████████████████████████████████████████████▉                                                                                                            | 403/1352 [01:38<03:45,  4.20it/s]

neg tensor(0.6949, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9806, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<Mean

Training:  30%|██████████████████████████████████████████████                                                                                                            | 404/1352 [01:38<03:50,  4.12it/s]

neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9663, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9582, grad_fn=<MeanBackward0>)
pos tensor(0.9979, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<Mean

Training:  30%|██████████████████████████████████████████████▏                                                                                                           | 405/1352 [01:39<03:42,  4.26it/s]

neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9697, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBack

Training:  30%|██████████████████████████████████████████████▏                                                                                                           | 406/1352 [01:39<03:49,  4.12it/s]

neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9668, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9634, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<Mean

Training:  30%|██████████████████████████████████████████████▎                                                                                                           | 407/1352 [01:39<03:30,  4.49it/s]

neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9963, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBack

Training:  30%|██████████████████████████████████████████████▍                                                                                                           | 408/1352 [01:39<03:25,  4.60it/s]

neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9370, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.7931, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(-0.5026, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)


Training:  30%|██████████████████████████████████████████████▌                                                                                                           | 409/1352 [01:40<03:36,  4.35it/s]

neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.8144, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.8905, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.8695, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBack

Training:  30%|██████████████████████████████████████████████▋                                                                                                           | 410/1352 [01:40<03:36,  4.35it/s]

neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9726, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.7945, grad_fn=<MeanBackward0>)
pos tensor(0.9362, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<Mean

Training:  30%|██████████████████████████████████████████████▊                                                                                                           | 411/1352 [01:40<03:41,  4.25it/s]

neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.9825, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.7015, grad_fn=<MeanBackward0>)
pos tensor(0.9261, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9297, grad_fn=<MeanBackward0>)
neg tensor(0.9651, grad_fn=<Mean

Training:  30%|██████████████████████████████████████████████▉                                                                                                           | 412/1352 [01:40<03:43,  4.21it/s]

neg tensor(0.9175, grad_fn=<MeanBackward0>)
pos tensor(0.9381, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.8901, grad_fn=<MeanBackward0>)
pos tensor(0.9383, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.8781, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.5879, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████                                                                                                           | 413/1352 [01:41<03:41,  4.25it/s]

neg tensor(0.7264, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9536, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9783, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9684, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▏                                                                                                          | 414/1352 [01:41<03:43,  4.19it/s]

neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9703, grad_fn=<MeanBackward0>)
pos tensor(0.9252, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(0.9437, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9738, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9505, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9468, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▎                                                                                                          | 415/1352 [01:41<03:44,  4.17it/s]

neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9442, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9590, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9601, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9167, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▍                                                                                                          | 416/1352 [01:41<03:37,  4.31it/s]

neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9477, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.2980, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9591, grad_fn=<MeanBackward0>)
pos tensor(0.9419, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▍                                                                                                          | 417/1352 [01:41<03:37,  4.30it/s]

neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.4988, grad_fn=<MeanBackward0>)
pos tensor(0.9100, grad_fn=<MeanBackward0>)
neg tensor(0.9683, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.6535, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.8726, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▌                                                                                                          | 418/1352 [01:42<03:30,  4.43it/s]

neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9731, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▋                                                                                                          | 419/1352 [01:42<03:32,  4.40it/s]

neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9668, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9604, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9557, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9754, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▊                                                                                                          | 420/1352 [01:42<03:35,  4.31it/s]

neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9698, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9204, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<Mean

Training:  31%|███████████████████████████████████████████████▉                                                                                                          | 421/1352 [01:42<03:31,  4.41it/s]

neg tensor(0.8152, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9722, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.8976, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.7585, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.1730, grad_fn=<MeanBackward0>)
pos tensor(0.9571, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<Mean

Training:  31%|████████████████████████████████████████████████                                                                                                          | 422/1352 [01:43<03:28,  4.46it/s]

neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.7147, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.0719, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<Mean

Training:  31%|████████████████████████████████████████████████▏                                                                                                         | 423/1352 [01:43<03:36,  4.29it/s]

neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9639, grad_fn=<MeanBackward0>)
pos tensor(0.9571, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBack

Training:  31%|████████████████████████████████████████████████▎                                                                                                         | 424/1352 [01:43<03:33,  4.35it/s]

neg tensor(0.9548, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.8422, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9594, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9800, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9201, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBack

Training:  31%|████████████████████████████████████████████████▍                                                                                                         | 425/1352 [01:43<03:34,  4.33it/s]

neg tensor(0.9634, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.8237, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<Mean

Training:  32%|████████████████████████████████████████████████▌                                                                                                         | 426/1352 [01:43<03:26,  4.50it/s]

neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.1068, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.8815, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<Mean

Training:  32%|████████████████████████████████████████████████▋                                                                                                         | 427/1352 [01:44<03:32,  4.35it/s]

neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9796, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.8806, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.7928, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9237, grad_fn=<MeanBack

Training:  32%|████████████████████████████████████████████████▊                                                                                                         | 428/1352 [01:44<03:21,  4.59it/s]

neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9461, grad_fn=<MeanBackward0>)
pos tensor(0.9970, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9166, grad_fn=<MeanBackward0>)
pos tensor(0.9236, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9259, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9006, grad_fn=<Mean

Training:  32%|████████████████████████████████████████████████▊                                                                                                         | 429/1352 [01:44<03:41,  4.18it/s]

neg tensor(0.8855, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9610, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.8943, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBack

Training:  32%|████████████████████████████████████████████████▉                                                                                                         | 430/1352 [01:44<03:34,  4.30it/s]

neg tensor(0.9293, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9654, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.5601, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████                                                                                                         | 431/1352 [01:45<03:34,  4.29it/s]

neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9557, grad_fn=<MeanBackward0>)
pos tensor(0.9414, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9559, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.8793, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.6261, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9440, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward

Training:  32%|█████████████████████████████████████████████████▏                                                                                                        | 432/1352 [01:45<03:36,  4.25it/s]

neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9516, grad_fn=<MeanBackward0>)
pos tensor(0.9730, grad_fn=<MeanBackward0>)
neg tensor(0.9708, grad_fn=<MeanBackward0>)
pos tensor(0.9555, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9381, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9611, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9316, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████▎                                                                                                        | 433/1352 [01:45<03:32,  4.32it/s]

neg tensor(0.7393, grad_fn=<MeanBackward0>)
pos tensor(0.8856, grad_fn=<MeanBackward0>)
neg tensor(0.9577, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9664, grad_fn=<MeanBackward0>)
neg tensor(0.9617, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.5621, grad_fn=<MeanBackward0>)
pos tensor(0.8476, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9716, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.6279, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9647, grad_fn=<MeanBackward0>)
pos tensor(0.8837, grad_fn=<MeanBackward0>)
neg tensor(0.6148, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████▍                                                                                                        | 434/1352 [01:45<03:40,  4.17it/s]

neg tensor(0.9531, grad_fn=<MeanBackward0>)
pos tensor(0.9677, grad_fn=<MeanBackward0>)
neg tensor(0.8206, grad_fn=<MeanBackward0>)
pos tensor(0.7508, grad_fn=<MeanBackward0>)
neg tensor(0.9727, grad_fn=<MeanBackward0>)
pos tensor(0.9610, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(0.9694, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9616, grad_fn=<MeanBackward0>)
neg tensor(0.8400, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9405, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████▌                                                                                                        | 435/1352 [01:46<03:33,  4.30it/s]

neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9409, grad_fn=<MeanBackward0>)
neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9457, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9451, grad_fn=<MeanBackward0>)
pos tensor(0.8982, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9720, grad_fn=<MeanBackward0>)
neg tensor(0.9409, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9602, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9658, grad_fn=<MeanBackward0>)
pos tensor(0.9574, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9625, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████▋                                                                                                        | 436/1352 [01:46<03:30,  4.36it/s]

neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9495, grad_fn=<MeanBackward0>)
pos tensor(0.9110, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9602, grad_fn=<MeanBackward0>)
pos tensor(0.9287, grad_fn=<MeanBackward0>)
neg tensor(0.9324, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.5863, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.6709, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9541, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████▊                                                                                                        | 437/1352 [01:46<03:22,  4.52it/s]

neg tensor(0.9403, grad_fn=<MeanBackward0>)
pos tensor(0.9741, grad_fn=<MeanBackward0>)
neg tensor(0.9769, grad_fn=<MeanBackward0>)
pos tensor(0.9515, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9433, grad_fn=<MeanBackward0>)
pos tensor(0.9351, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.8829, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9663, grad_fn=<MeanBackward0>)
pos tensor(0.9309, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<Mean

Training:  32%|█████████████████████████████████████████████████▉                                                                                                        | 438/1352 [01:46<03:27,  4.42it/s]

neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9555, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9242, grad_fn=<MeanBackward0>)
neg tensor(0.8085, grad_fn=<MeanBackward0>)
pos tensor(0.9968, grad_fn=<MeanBackward0>)
neg tensor(0.9612, grad_fn=<MeanBackward0>)
pos tensor(0.9409, grad_fn=<MeanBackward0>)
neg tensor(0.9482, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<Mean

Training:  32%|██████████████████████████████████████████████████                                                                                                        | 439/1352 [01:47<03:32,  4.31it/s]

neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9850, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9969, grad_fn=<MeanBackward0>)
neg tensor(0.9564, grad_fn=<MeanBackward0>)
pos tensor(0.9465, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.8800, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████                                                                                                        | 440/1352 [01:47<03:52,  3.93it/s]

neg tensor(0.9211, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9588, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9520, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.6076, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████▏                                                                                                       | 441/1352 [01:47<04:07,  3.69it/s]

neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9770, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.7375, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9692, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9816, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████▎                                                                                                       | 442/1352 [01:47<04:15,  3.56it/s]

neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████▍                                                                                                       | 443/1352 [01:48<04:05,  3.71it/s]

neg tensor(-0.3403, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9787, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9744, grad_fn=<Mea

Training:  33%|██████████████████████████████████████████████████▌                                                                                                       | 444/1352 [01:48<04:07,  3.67it/s]

neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████▋                                                                                                       | 445/1352 [01:48<03:59,  3.79it/s]

neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.8762, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████▊                                                                                                       | 446/1352 [01:48<03:45,  4.02it/s]

neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9623, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.6172, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<Mean

Training:  33%|██████████████████████████████████████████████████▉                                                                                                       | 447/1352 [01:49<03:37,  4.17it/s]

neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<Mean

Training:  33%|███████████████████████████████████████████████████                                                                                                       | 448/1352 [01:49<03:40,  4.09it/s]

neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9459, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<Mean

Training:  33%|███████████████████████████████████████████████████▏                                                                                                      | 449/1352 [01:49<03:51,  3.90it/s]

neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.7396, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<Mean

Training:  33%|███████████████████████████████████████████████████▎                                                                                                      | 450/1352 [01:49<03:43,  4.04it/s]

neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<Mean

Training:  33%|███████████████████████████████████████████████████▎                                                                                                      | 451/1352 [01:50<03:41,  4.07it/s]

neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.3288, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBack

Training:  33%|███████████████████████████████████████████████████▍                                                                                                      | 452/1352 [01:50<03:43,  4.02it/s]

neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9687, grad_fn=<Mean

Training:  34%|███████████████████████████████████████████████████▌                                                                                                      | 453/1352 [01:50<03:40,  4.07it/s]

neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBac

Training:  34%|███████████████████████████████████████████████████▋                                                                                                      | 454/1352 [01:50<03:34,  4.19it/s]

neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.8873, grad_fn=<MeanBackward0>)
pos tensor(0.9980, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9955, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<Mean

Training:  34%|███████████████████████████████████████████████████▊                                                                                                      | 455/1352 [01:51<03:11,  4.68it/s]

tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)


Training:  34%|███████████████████████████████████████████████████▉                                                                                                      | 456/1352 [01:51<03:32,  4.22it/s]

neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9795, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████                                                                                                      | 457/1352 [01:51<03:27,  4.32it/s]

neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▏                                                                                                     | 458/1352 [01:51<03:35,  4.14it/s]

neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9517, grad_fn=<MeanBackward0>)
pos tensor(0.9958, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▎                                                                                                     | 459/1352 [01:52<04:10,  3.56it/s]

neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBack

Training:  34%|████████████████████████████████████████████████████▍                                                                                                     | 460/1352 [01:52<04:09,  3.58it/s]

neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.5498, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▌                                                                                                     | 461/1352 [01:52<04:05,  3.62it/s]

neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▌                                                                                                     | 462/1352 [01:52<04:01,  3.68it/s]

neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▋                                                                                                     | 463/1352 [01:53<03:55,  3.77it/s]

neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9345, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▊                                                                                                     | 464/1352 [01:53<04:10,  3.55it/s]

neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<Mean

Training:  34%|████████████████████████████████████████████████████▉                                                                                                     | 465/1352 [01:53<03:57,  3.74it/s]

neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(-1., grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackwar

Training:  34%|█████████████████████████████████████████████████████                                                                                                     | 466/1352 [01:53<03:44,  3.95it/s]

neg tensor(0.8137, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▏                                                                                                    | 467/1352 [01:54<03:49,  3.86it/s]

neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9101, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9765, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBack

Training:  35%|█████████████████████████████████████████████████████▎                                                                                                    | 468/1352 [01:54<03:34,  4.12it/s]

neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9975, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9952, grad_fn=<MeanBackward0>)
neg tensor(0.9766, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▍                                                                                                    | 469/1352 [01:54<03:32,  4.16it/s]

neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▌                                                                                                    | 470/1352 [01:54<03:17,  4.47it/s]

neg tensor(0.2910, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9794, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▋                                                                                                    | 471/1352 [01:55<03:36,  4.06it/s]

neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.8969, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.7284, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▊                                                                                                    | 472/1352 [01:55<03:52,  3.78it/s]

neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.4226, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9586, grad_fn=<MeanBackward0>)
neg tensor(0.9725, grad_fn=<MeanBackward0>)
pos tensor(0.9977, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▉                                                                                                    | 473/1352 [01:55<03:45,  3.89it/s]

neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9579, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9408, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<Mean

Training:  35%|█████████████████████████████████████████████████████▉                                                                                                    | 474/1352 [01:55<03:31,  4.14it/s]

neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.8418, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9063, grad_fn=<MeanBackward0>)
pos tensor(0.9947, grad_fn=<MeanBackward0>)
neg tensor(0.8802, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<Mean

Training:  35%|██████████████████████████████████████████████████████                                                                                                    | 475/1352 [01:56<03:19,  4.40it/s]

neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9663, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)


Training:  35%|██████████████████████████████████████████████████████▏                                                                                                   | 476/1352 [01:56<03:14,  4.50it/s]

neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9595, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9633, grad_fn=<MeanBackward0>)
pos tensor(0.9764, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<Mean

Training:  35%|██████████████████████████████████████████████████████▎                                                                                                   | 477/1352 [01:56<03:42,  3.93it/s]

neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.7348, grad_fn=<MeanBackward0>)
pos tensor(0.9294, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<Mean

Training:  35%|██████████████████████████████████████████████████████▍                                                                                                   | 478/1352 [01:56<03:46,  3.86it/s]

neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.3282, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9761, grad_fn=<Mean

Training:  35%|██████████████████████████████████████████████████████▌                                                                                                   | 479/1352 [01:57<03:54,  3.73it/s]

neg tensor(0.9673, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9815, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9022, grad_fn=<MeanBackward0>)
pos tensor(0.9666, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9699, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<Mean

Training:  36%|██████████████████████████████████████████████████████▋                                                                                                   | 480/1352 [01:57<03:51,  3.76it/s]

neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9809, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9718, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.8690, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<Mean

Training:  36%|██████████████████████████████████████████████████████▊                                                                                                   | 481/1352 [01:57<03:27,  4.20it/s]

neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9314, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.7447, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<Mean

Training:  36%|██████████████████████████████████████████████████████▉                                                                                                   | 482/1352 [01:57<03:13,  4.50it/s]

neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.6652, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9058, grad_fn=<MeanBackward0>)
pos tensor(0.9363, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9446, grad_fn=<MeanBackward0>)


Training:  36%|███████████████████████████████████████████████████████                                                                                                   | 483/1352 [01:58<03:14,  4.47it/s]

pos tensor(0.9245, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBackward0>)
pos tensor(0.9631, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9561, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)


Training:  36%|███████████████████████████████████████████████████████▏                                                                                                  | 484/1352 [01:58<03:14,  4.47it/s]

neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9569, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.6533, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<Mean

Training:  36%|███████████████████████████████████████████████████████▏                                                                                                  | 485/1352 [01:58<03:05,  4.67it/s]

neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9791, grad_fn=<MeanBackward0>)
neg tensor(0.9835, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<Mean

Training:  36%|███████████████████████████████████████████████████████▎                                                                                                  | 486/1352 [01:58<03:13,  4.46it/s]

neg tensor(0.9614, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.6878, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9773, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBack

Training:  36%|███████████████████████████████████████████████████████▍                                                                                                  | 487/1352 [01:58<03:02,  4.73it/s]

neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9688, grad_fn=<MeanBackward0>)
pos tensor(0.9992, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9858, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<Mean

Training:  36%|███████████████████████████████████████████████████████▌                                                                                                  | 488/1352 [01:59<03:21,  4.28it/s]

neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9661, grad_fn=<MeanBackward0>)
pos tensor(0.9497, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9734, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9743, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<Mean

Training:  36%|███████████████████████████████████████████████████████▋                                                                                                  | 489/1352 [01:59<03:12,  4.49it/s]

neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9564, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.7067, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<Mean

Training:  36%|███████████████████████████████████████████████████████▊                                                                                                  | 490/1352 [01:59<03:15,  4.41it/s]

neg tensor(0.8380, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.8970, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9558, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.8620, grad_fn=<MeanBackward0>)
pos tensor(0.9947, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9689, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9226, grad_fn=<Mean

Training:  36%|███████████████████████████████████████████████████████▉                                                                                                  | 491/1352 [01:59<03:09,  4.54it/s]

neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9715, grad_fn=<MeanBackward0>)
pos tensor(0.9767, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.6142, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.7438, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9667, grad_fn=<MeanBack

Training:  36%|████████████████████████████████████████████████████████                                                                                                  | 492/1352 [02:00<02:54,  4.94it/s]

pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9823, grad_fn=<MeanBackward0>)
neg tensor(0.8969, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)


Training:  36%|████████████████████████████████████████████████████████▏                                                                                                 | 493/1352 [02:00<03:02,  4.72it/s]

neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9620, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9812, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.7294, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9003, grad_fn=<MeanBackward0>)
pos tensor(0.9484, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9185, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9655, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)


Training:  37%|████████████████████████████████████████████████████████▎                                                                                                 | 494/1352 [02:00<03:06,  4.61it/s]

neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.8958, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9689, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9500, grad_fn=<MeanBackward0>)
pos tensor(0.9436, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.8753, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9583, grad_fn=<MeanBackward0>)
pos tensor(0.9462, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<Mean

Training:  37%|████████████████████████████████████████████████████████▍                                                                                                 | 495/1352 [02:00<03:23,  4.22it/s]

neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9728, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9772, grad_fn=<MeanBackward0>)
pos tensor(0.9641, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9130, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9695, grad_fn=<MeanBack

Training:  37%|████████████████████████████████████████████████████████▍                                                                                                 | 496/1352 [02:00<03:20,  4.26it/s]

neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9548, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9637, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9787, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<Mean

Training:  37%|████████████████████████████████████████████████████████▌                                                                                                 | 497/1352 [02:01<03:31,  4.05it/s]

neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.7916, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9431, grad_fn=<MeanBackward0>)
pos tensor(0.9145, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9574, grad_fn=<MeanBackward0>)
pos tensor(0.8986, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.4355, grad_fn=<Mean

Training:  37%|████████████████████████████████████████████████████████▋                                                                                                 | 498/1352 [02:01<03:44,  3.80it/s]

neg tensor(0.9000, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9770, grad_fn=<MeanBackward0>)
pos tensor(0.9520, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.8117, grad_fn=<MeanBackward0>)
pos tensor(0.9368, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9691, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9497, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9716, grad_fn=<Mean

Training:  37%|████████████████████████████████████████████████████████▊                                                                                                 | 499/1352 [02:01<03:37,  3.91it/s]

neg tensor(0.9792, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9363, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.5849, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.6988, grad_fn=<MeanBackward0>)
pos tensor(0.9497, grad_fn=<MeanBackward0>)
neg tensor(0.9784, grad_fn=<MeanBackward0>)
pos tensor(0.9837, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.8912, grad_fn=<MeanBackward0>)
pos tensor(0.8842, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<Mean

Training:  37%|████████████████████████████████████████████████████████▉                                                                                                 | 500/1352 [02:01<03:19,  4.27it/s]

neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9705, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9443, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.8472, grad_fn=<Mean

Training:  37%|█████████████████████████████████████████████████████████                                                                                                 | 501/1352 [02:02<03:30,  4.04it/s]

neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9627, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.6797, grad_fn=<Mean

Training:  37%|█████████████████████████████████████████████████████████▏                                                                                                | 502/1352 [02:02<03:37,  3.91it/s]

neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9486, grad_fn=<MeanBackward0>)
pos tensor(0.9801, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9549, grad_fn=<MeanBackward0>)
pos tensor(0.9481, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<Mean

Training:  37%|█████████████████████████████████████████████████████████▎                                                                                                | 503/1352 [02:02<03:32,  4.00it/s]

neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.7927, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<Mean

Training:  37%|█████████████████████████████████████████████████████████▍                                                                                                | 504/1352 [02:02<03:16,  4.32it/s]

pos tensor(0.9847, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9840, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9974, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.8779, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<Mean

Training:  37%|█████████████████████████████████████████████████████████▌                                                                                                | 505/1352 [02:03<03:18,  4.26it/s]

neg tensor(0.7273, grad_fn=<MeanBackward0>)
pos tensor(0.9579, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9846, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9958, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9553, grad_fn=<MeanBackward0>)
neg tensor(0.1970, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<Mean

Training:  37%|█████████████████████████████████████████████████████████▋                                                                                                | 506/1352 [02:03<03:28,  4.06it/s]

neg tensor(0.9958, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9278, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9733, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9722, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<MeanBackward0>)
pos tensor(0.9578, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<Mean

Training:  38%|█████████████████████████████████████████████████████████▊                                                                                                | 507/1352 [02:03<03:23,  4.15it/s]

neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.8414, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.7247, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward

Training:  38%|█████████████████████████████████████████████████████████▊                                                                                                | 508/1352 [02:03<03:21,  4.18it/s]

neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9955, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<Mean

Training:  38%|█████████████████████████████████████████████████████████▉                                                                                                | 509/1352 [02:04<03:08,  4.46it/s]

neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9589, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9736, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9571, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<Mean

Training:  38%|██████████████████████████████████████████████████████████                                                                                                | 510/1352 [02:04<03:10,  4.42it/s]

neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9544, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9448, grad_fn=<MeanBackward0>)
pos tensor(0.9991, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9745, grad_fn=<MeanBackward0>)
neg tensor(0.5773, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<Mean

Training:  38%|██████████████████████████████████████████████████████████▏                                                                                               | 511/1352 [02:04<02:58,  4.72it/s]

tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9734, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9527, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg 

Training:  38%|██████████████████████████████████████████████████████████▎                                                                                               | 512/1352 [02:04<02:59,  4.68it/s]

tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9637, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9715, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9719, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)


Training:  38%|██████████████████████████████████████████████████████████▍                                                                                               | 513/1352 [02:05<03:17,  4.26it/s]

neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9737, grad_fn=<MeanBackward0>)
pos tensor(0.9753, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9746, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<Mean

Training:  38%|██████████████████████████████████████████████████████████▌                                                                                               | 514/1352 [02:05<03:13,  4.34it/s]

neg tensor(0.9837, grad_fn=<MeanBackward0>)
pos tensor(0.9666, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9584, grad_fn=<MeanBackward0>)
pos tensor(0.9637, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9497, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.7915, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<MeanBack

Training:  38%|██████████████████████████████████████████████████████████▋                                                                                               | 515/1352 [02:05<03:10,  4.39it/s]

neg tensor(0.9154, grad_fn=<MeanBackward0>)
pos tensor(0.9630, grad_fn=<MeanBackward0>)
neg tensor(0.9834, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9802, grad_fn=<MeanBackward0>)
pos tensor(0.9738, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9599, grad_fn=<MeanBackward0>)
pos tensor(0.9949, grad_fn=<MeanBackward0>)
neg tensor(0.9785, grad_fn=<MeanBackward0>)
pos tensor(0.9378, grad_fn=<MeanBackward0>)
neg tensor(0.9639, grad_fn=<MeanBackward0>)
pos tensor(0.9562, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9635, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<Mean

Training:  38%|██████████████████████████████████████████████████████████▊                                                                                               | 516/1352 [02:05<03:15,  4.27it/s]

neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9700, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.8762, grad_fn=<MeanBackward0>)
pos tensor(0.9417, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9842, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<Mean

Training:  38%|██████████████████████████████████████████████████████████▉                                                                                               | 517/1352 [02:05<03:03,  4.55it/s]

neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9337, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9906, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9817, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9607, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9432, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9632, grad_fn=<Mean

Training:  38%|███████████████████████████████████████████████████████████                                                                                               | 518/1352 [02:06<03:19,  4.19it/s]

neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9757, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.7744, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.8342, grad_fn=<MeanBackward0>)
pos tensor(0.9965, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9820, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9766, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<Mean

Training:  38%|███████████████████████████████████████████████████████████                                                                                               | 519/1352 [02:06<03:20,  4.15it/s]

neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9958, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9690, grad_fn=<MeanBackward0>)
pos tensor(0.9798, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9685, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<Mean

Training:  38%|███████████████████████████████████████████████████████████▏                                                                                              | 520/1352 [02:06<03:10,  4.36it/s]

neg tensor(0.9744, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9799, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.2963, grad_fn=<MeanBackward0>)
pos tensor(0.8935, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.7573, grad_fn=<Mean

Training:  39%|███████████████████████████████████████████████████████████▎                                                                                              | 521/1352 [02:06<03:25,  4.05it/s]

neg tensor(0.9686, grad_fn=<MeanBackward0>)
pos tensor(0.9465, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9670, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9687, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9778, grad_fn=<MeanBackward0>)
neg tensor(0.9526, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<Mean

Training:  39%|███████████████████████████████████████████████████████████▍                                                                                              | 522/1352 [02:07<03:26,  4.01it/s]

neg tensor(0.9634, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9203, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9876, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.9791, grad_fn=<MeanBackward0>)
pos tensor(0.9774, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9459, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<Mean

Training:  39%|███████████████████████████████████████████████████████████▌                                                                                              | 523/1352 [02:07<03:22,  4.09it/s]

neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.7063, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9295, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9831, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9835, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9819, grad_fn=<MeanBackward0>)
neg tensor(0.9809, grad_fn=<MeanBack

Training:  39%|███████████████████████████████████████████████████████████▋                                                                                              | 524/1352 [02:07<03:16,  4.22it/s]

neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9711, grad_fn=<MeanBackward0>)
neg tensor(0.9666, grad_fn=<MeanBackward0>)
pos tensor(0.9622, grad_fn=<MeanBackward0>)
neg tensor(0.9758, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9760, grad_fn=<MeanBackward0>)
pos tensor(0.9737, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9335, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9883, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<Mean

Training:  39%|███████████████████████████████████████████████████████████▊                                                                                              | 525/1352 [02:07<03:34,  3.86it/s]

neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9178, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9680, grad_fn=<MeanBackward0>)
neg tensor(0.9542, grad_fn=<MeanBackward0>)
pos tensor(0.9303, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<Mean

Training:  39%|███████████████████████████████████████████████████████████▉                                                                                              | 526/1352 [02:08<03:31,  3.90it/s]

neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9098, grad_fn=<MeanBackward0>)
pos tensor(0.9676, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.8981, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9905, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9872, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9801, grad_fn=<Mean

Training:  39%|████████████████████████████████████████████████████████████                                                                                              | 527/1352 [02:08<03:18,  4.15it/s]

neg tensor(0.9790, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9368, grad_fn=<MeanBackward0>)
pos tensor(0.9488, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9336, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<Mean

Training:  39%|████████████████████████████████████████████████████████████▏                                                                                             | 528/1352 [02:08<03:05,  4.43it/s]

neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9870, grad_fn=<MeanBackward0>)
neg tensor(0.9518, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.8958, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9468, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9536, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9080, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)


Training:  39%|████████████████████████████████████████████████████████████▎                                                                                             | 529/1352 [02:08<03:04,  4.45it/s]

neg tensor(0.9833, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9886, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9856, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.2986, grad_fn=<MeanBackward0>)
pos tensor(0.8574, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<Mean

Training:  39%|████████████████████████████████████████████████████████████▎                                                                                             | 530/1352 [02:09<03:05,  4.44it/s]

neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9674, grad_fn=<MeanBackward0>)
pos tensor(0.9633, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9450, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9659, grad_fn=<MeanBackward0>)
neg tensor(0.9626, grad_fn=<MeanBackward0>)
pos tensor(0.9328, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.8733, grad_fn=<Mean

Training:  39%|████████████████████████████████████████████████████████████▍                                                                                             | 531/1352 [02:09<03:03,  4.48it/s]

neg tensor(0.9706, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9798, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9702, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9812, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<Mean

Training:  39%|████████████████████████████████████████████████████████████▌                                                                                             | 532/1352 [02:09<03:17,  4.15it/s]

neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9881, grad_fn=<MeanBackward0>)
pos tensor(0.9729, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9736, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.8288, grad_fn=<MeanBackward0>)
pos tensor(0.9962, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9678, grad_fn=<MeanBackward0>)
pos tensor(0.9570, grad_fn=<MeanBackward0>)
neg tensor(0.7401, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBack

Training:  39%|████████████████████████████████████████████████████████████▋                                                                                             | 533/1352 [02:09<03:13,  4.23it/s]

neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9333, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9192, grad_fn=<MeanBackward0>)
pos tensor(0.9554, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9902, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9677, grad_fn=<MeanBackward0>)
pos tensor(0.9706, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9620, grad_fn=<Mean

Training:  39%|████████████████████████████████████████████████████████████▊                                                                                             | 534/1352 [02:09<03:05,  4.40it/s]

neg tensor(0.9351, grad_fn=<MeanBackward0>)
pos tensor(0.8859, grad_fn=<MeanBackward0>)
neg tensor(0.9625, grad_fn=<MeanBackward0>)
pos tensor(0.9607, grad_fn=<MeanBackward0>)
neg tensor(0.9694, grad_fn=<MeanBackward0>)
pos tensor(0.9618, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9714, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9664, grad_fn=<MeanBackward0>)
pos tensor(0.9375, grad_fn=<MeanBackward0>)
neg tensor(0.4896, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9599, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9727, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<Mean

Training:  40%|████████████████████████████████████████████████████████████▉                                                                                             | 535/1352 [02:10<03:01,  4.50it/s]

neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9957, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9760, grad_fn=<MeanBackward0>)
neg tensor(0.9826, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9648, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.8900, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.2880, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████                                                                                             | 536/1352 [02:10<03:18,  4.12it/s]

neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9371, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9774, grad_fn=<MeanBackward0>)
pos tensor(0.9690, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.8367, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9762, grad_fn=<MeanBackward0>)
pos tensor(0.9655, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBack

Training:  40%|█████████████████████████████████████████████████████████████▏                                                                                            | 537/1352 [02:10<03:20,  4.06it/s]

neg tensor(0.9390, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9370, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9818, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9848, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9745, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9665, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9681, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBack

Training:  40%|█████████████████████████████████████████████████████████████▎                                                                                            | 538/1352 [02:11<03:31,  3.86it/s]

neg tensor(0.9155, grad_fn=<MeanBackward0>)
pos tensor(0.9962, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9840, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9742, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9813, grad_fn=<MeanBackward0>)
pos tensor(0.9877, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9578, grad_fn=<MeanBackward0>)
pos tensor(0.9751, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9465, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████▍                                                                                            | 539/1352 [02:11<03:34,  3.79it/s]

neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9778, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9824, grad_fn=<MeanBackward0>)
pos tensor(0.9776, grad_fn=<MeanBackward0>)
neg tensor(0.8421, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.7788, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9963, grad_fn=<MeanBackward0>)
neg tensor(0.9508, grad_fn=<MeanBackward0>)
pos tensor(0.9715, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████▌                                                                                            | 540/1352 [02:11<03:24,  3.97it/s]

neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.6327, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9834, grad_fn=<MeanBackward0>)
neg tensor(0.9907, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████▌                                                                                            | 541/1352 [02:11<03:21,  4.02it/s]

neg tensor(0.5963, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9752, grad_fn=<MeanBackward0>)
neg tensor(0.9804, grad_fn=<MeanBackward0>)
pos tensor(0.9606, grad_fn=<MeanBackward0>)
neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9659, grad_fn=<MeanBackward0>)
pos tensor(0.9717, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9961, grad_fn=<MeanBackward0>)
neg tensor(0.9896, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████▋                                                                                            | 542/1352 [02:11<03:16,  4.13it/s]

neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9445, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9972, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9958, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9713, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████▊                                                                                            | 543/1352 [02:12<03:10,  4.25it/s]

neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9958, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9654, grad_fn=<MeanBackward0>)
neg tensor(0.8374, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<Mean

Training:  40%|█████████████████████████████████████████████████████████████▉                                                                                            | 544/1352 [02:12<03:06,  4.33it/s]

neg tensor(0.8098, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9000, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.8657, grad_fn=<MeanBackward0>)
pos tensor(0.9522, grad_fn=<MeanBackward0>)
neg tensor(0.9295, grad_fn=<MeanBackward0>)
pos tensor(0.9288, grad_fn=<MeanBackward0>)
neg tensor(0.8732, grad_fn=<MeanBackward0>)
pos tensor(0.9986, grad_fn=<MeanBackward0>)
neg tensor(-0.0025, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBac

Training:  40%|██████████████████████████████████████████████████████████████                                                                                            | 545/1352 [02:12<03:07,  4.30it/s]

neg tensor(0.7402, grad_fn=<MeanBackward0>)
pos tensor(0.9889, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9797, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9608, grad_fn=<MeanBackward0>)
pos tensor(0.9523, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<Mean

Training:  40%|██████████████████████████████████████████████████████████████▏                                                                                           | 546/1352 [02:12<03:16,  4.10it/s]

neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9966, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.8844, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9816, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9615, grad_fn=<MeanBackward0>)
pos tensor(0.9719, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<Mean

Training:  40%|██████████████████████████████████████████████████████████████▎                                                                                           | 547/1352 [02:13<03:14,  4.14it/s]

neg tensor(0.9756, grad_fn=<MeanBackward0>)
pos tensor(0.9756, grad_fn=<MeanBackward0>)
neg tensor(0.8758, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.5973, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9827, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9869, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.8503, grad_fn=<Mean

Training:  41%|██████████████████████████████████████████████████████████████▍                                                                                           | 548/1352 [02:13<03:06,  4.32it/s]

neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9441, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBackward0>)
pos tensor(0.9814, grad_fn=<MeanBackward0>)
neg tensor(0.9362, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9968, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.7872, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9756, grad_fn=<Mean

Training:  41%|██████████████████████████████████████████████████████████████▌                                                                                           | 549/1352 [02:13<03:12,  4.17it/s]

neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9872, grad_fn=<MeanBackward0>)
neg tensor(0.9796, grad_fn=<MeanBackward0>)
pos tensor(0.9725, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9517, grad_fn=<MeanBackward0>)
pos tensor(0.9781, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9894, grad_fn=<Mean

Training:  41%|██████████████████████████████████████████████████████████████▋                                                                                           | 550/1352 [02:13<03:33,  3.75it/s]

neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9971, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9728, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9458, grad_fn=<MeanBackward0>)
pos tensor(0.9471, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9627, grad_fn=<MeanBackward0>)
neg tensor(0.9691, grad_fn=<Mean

Training:  41%|██████████████████████████████████████████████████████████████▊                                                                                           | 551/1352 [02:14<03:22,  3.96it/s]

neg tensor(0.7739, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9533, grad_fn=<MeanBackward0>)
pos tensor(0.9876, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9244, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9755, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9807, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<Mean

Training:  41%|██████████████████████████████████████████████████████████████▉                                                                                           | 552/1352 [02:14<03:08,  4.25it/s]

neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9584, grad_fn=<MeanBackward0>)
neg tensor(0.9972, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.7908, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9849, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9534, grad_fn=<Mean

Training:  41%|██████████████████████████████████████████████████████████████▉                                                                                           | 553/1352 [02:14<03:09,  4.22it/s]

neg tensor(0.9494, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9814, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9500, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9969, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9807, grad_fn=<MeanBackward0>)
pos tensor(0.9615, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████                                                                                           | 554/1352 [02:14<03:27,  3.84it/s]

neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9605, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████▏                                                                                          | 555/1352 [02:15<03:26,  3.86it/s]

neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9852, grad_fn=<MeanBackward0>)
neg tensor(0.8385, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9971, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9751, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.8078, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9473, grad_fn=<MeanBackward0>)
pos tensor(0.9526, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████▎                                                                                          | 556/1352 [02:15<03:04,  4.33it/s]

neg tensor(0.8940, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9513, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)


Training:  41%|███████████████████████████████████████████████████████████████▍                                                                                          | 557/1352 [02:15<03:07,  4.24it/s]

neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9622, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9333, grad_fn=<MeanBackward0>)
pos tensor(0.9194, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9265, grad_fn=<MeanBackward0>)
pos tensor(0.9527, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9670, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9091, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████▌                                                                                          | 558/1352 [02:15<03:03,  4.33it/s]

neg tensor(0.7328, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9919, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.0282, grad_fn=<MeanBackward0>)
pos tensor(0.9804, grad_fn=<MeanBackward0>)
neg tensor(0.8583, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9624, grad_fn=<MeanBackward0>)
neg tensor(0.9622, grad_fn=<MeanBackward0>)
pos tensor(0.9768, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9675, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████▋                                                                                          | 559/1352 [02:16<03:07,  4.23it/s]

neg tensor(0.9544, grad_fn=<MeanBackward0>)
pos tensor(0.9810, grad_fn=<MeanBackward0>)
neg tensor(0.9113, grad_fn=<MeanBackward0>)
pos tensor(0.9784, grad_fn=<MeanBackward0>)
neg tensor(0.9555, grad_fn=<MeanBackward0>)
pos tensor(0.9806, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9790, grad_fn=<MeanBackward0>)
neg tensor(0.9300, grad_fn=<MeanBackward0>)
pos tensor(0.9590, grad_fn=<MeanBackward0>)
neg tensor(0.9890, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████▊                                                                                          | 560/1352 [02:16<03:12,  4.12it/s]

neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9713, grad_fn=<MeanBackward0>)
neg tensor(0.9509, grad_fn=<MeanBackward0>)
pos tensor(0.9749, grad_fn=<MeanBackward0>)
neg tensor(0.9767, grad_fn=<MeanBackward0>)
pos tensor(0.9576, grad_fn=<MeanBackward0>)
neg tensor(0.9712, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9958, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9777, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9723, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9762, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<Mean

Training:  41%|███████████████████████████████████████████████████████████████▉                                                                                          | 561/1352 [02:16<03:27,  3.81it/s]

neg tensor(0.9591, grad_fn=<MeanBackward0>)
pos tensor(0.9464, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9496, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9630, grad_fn=<MeanBackward0>)
pos tensor(0.9557, grad_fn=<MeanBackward0>)
neg tensor(0.9388, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9824, grad_fn=<MeanBackward0>)
neg tensor(0.9723, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9585, grad_fn=<MeanBackward0>)
pos tensor(0.9605, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████                                                                                          | 562/1352 [02:16<03:22,  3.91it/s]

neg tensor(0.9340, grad_fn=<MeanBackward0>)
pos tensor(0.8984, grad_fn=<MeanBackward0>)
neg tensor(0.9660, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9649, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9477, grad_fn=<MeanBackward0>)
pos tensor(0.9442, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9861, grad_fn=<MeanBackward0>)
pos tensor(0.9708, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9531, grad_fn=<MeanBackward0>)
pos tensor(0.9192, grad_fn=<MeanBackward0>)
neg tensor(0.9492, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▏                                                                                         | 563/1352 [02:17<03:25,  3.84it/s]

neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.8735, grad_fn=<MeanBackward0>)
pos tensor(0.9975, grad_fn=<MeanBackward0>)
neg tensor(0.9377, grad_fn=<MeanBackward0>)
pos tensor(0.9444, grad_fn=<MeanBackward0>)
neg tensor(0.9815, grad_fn=<MeanBackward0>)
pos tensor(0.9712, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9744, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.9847, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9398, grad_fn=<MeanBackward0>)
pos tensor(0.9638, grad_fn=<MeanBackward0>)
neg tensor(0.9857, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9549, grad_fn=<MeanBackward0>)
pos tensor(0.9279, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▏                                                                                         | 564/1352 [02:17<03:19,  3.94it/s]

neg tensor(0.9128, grad_fn=<MeanBackward0>)
pos tensor(0.9821, grad_fn=<MeanBackward0>)
neg tensor(0.9363, grad_fn=<MeanBackward0>)
pos tensor(0.9460, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9656, grad_fn=<MeanBackward0>)
neg tensor(0.9780, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9793, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9408, grad_fn=<MeanBackward0>)
pos tensor(0.9779, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9838, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9730, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▎                                                                                         | 565/1352 [02:17<03:10,  4.13it/s]

neg tensor(0.9865, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9341, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9619, grad_fn=<MeanBackward0>)
pos tensor(0.9472, grad_fn=<MeanBackward0>)
neg tensor(0.2623, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9871, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9896, grad_fn=<MeanBackward0>)
neg tensor(0.9122, grad_fn=<MeanBackward0>)
pos tensor(0.9955, grad_fn=<MeanBackward0>)
neg tensor(0.6072, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.8764, grad_fn=<MeanBackward0>)
pos tensor(0.9497, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9860, grad_fn=<MeanBackward0>)
neg tensor(0.9852, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▍                                                                                         | 566/1352 [02:17<03:02,  4.31it/s]

neg tensor(0.9637, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.7118, grad_fn=<MeanBackward0>)
pos tensor(0.9125, grad_fn=<MeanBackward0>)
neg tensor(0.9241, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9626, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.6296, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9645, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.7630, grad_fn=<MeanBackward0>)
pos tensor(0.9398, grad_fn=<MeanBackward0>)
neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9754, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▌                                                                                         | 567/1352 [02:18<03:07,  4.18it/s]

neg tensor(0.9776, grad_fn=<MeanBackward0>)
pos tensor(0.9587, grad_fn=<MeanBackward0>)
neg tensor(0.8407, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.8658, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9130, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.5773, grad_fn=<MeanBackward0>)
pos tensor(0.9703, grad_fn=<MeanBackward0>)
neg tensor(0.9622, grad_fn=<MeanBackward0>)
pos tensor(0.9407, grad_fn=<MeanBackward0>)
neg tensor(0.9748, grad_fn=<MeanBackward0>)
pos tensor(0.9669, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▋                                                                                         | 568/1352 [02:18<03:30,  3.72it/s]

neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9866, grad_fn=<MeanBackward0>)
pos tensor(0.9757, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.7121, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9773, grad_fn=<MeanBackward0>)
pos tensor(0.9696, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9209, grad_fn=<MeanBackward0>)
pos tensor(0.9107, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9841, grad_fn=<MeanBackward0>)
neg tensor(0.9717, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▊                                                                                         | 569/1352 [02:18<03:22,  3.87it/s]

neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9858, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9438, grad_fn=<MeanBackward0>)
neg tensor(0.8897, grad_fn=<MeanBackward0>)
pos tensor(0.9543, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9920, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9599, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9571, grad_fn=<MeanBackward0>)
pos tensor(0.9407, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9661, grad_fn=<MeanBackward0>)
pos tensor(0.9121, grad_fn=<MeanBackward0>)
neg tensor(0.9799, grad_fn=<MeanBackward0>)
pos tensor(0.9763, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<Mean

Training:  42%|████████████████████████████████████████████████████████████████▉                                                                                         | 570/1352 [02:18<03:25,  3.80it/s]

neg tensor(0.9771, grad_fn=<MeanBackward0>)
pos tensor(0.9266, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9808, grad_fn=<MeanBackward0>)
pos tensor(0.9795, grad_fn=<MeanBackward0>)
neg tensor(0.9606, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9843, grad_fn=<MeanBackward0>)
pos tensor(0.9846, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9828, grad_fn=<MeanBackward0>)
pos tensor(0.9626, grad_fn=<MeanBackward0>)
neg tensor(0.8923, grad_fn=<MeanBackward0>)
pos tensor(0.9632, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9945, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.8857, grad_fn=<Mean

Training:  42%|█████████████████████████████████████████████████████████████████                                                                                         | 571/1352 [02:19<03:00,  4.33it/s]

pos tensor(0.9570, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9863, grad_fn=<MeanBackward0>)
pos tensor(0.9895, grad_fn=<MeanBackward0>)
neg tensor(0.8889, grad_fn=<MeanBackward0>)
pos tensor(0.9962, grad_fn=<MeanBackward0>)
neg tensor(0.9897, grad_fn=<MeanBackward0>)
pos tensor(0.9875, grad_fn=<MeanBackward0>)
neg tensor(0.9823, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9557, grad_fn=<MeanBackward0>)
pos tensor(0.9567, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9307, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9864, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<Mean

Training:  42%|█████████████████████████████████████████████████████████████████▎                                                                                        | 573/1352 [02:19<02:58,  4.36it/s]

neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9893, grad_fn=<MeanBackward0>)
neg tensor(0.5953, grad_fn=<MeanBackward0>)
pos tensor(0.9964, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9966, grad_fn=<MeanBackward0>)
pos tensor(0.9928, grad_fn=<MeanBackward0>)
neg tensor(0.7504, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9903, grad_fn=<MeanBackward0>)
pos tensor(0.9849, grad_fn=<MeanBackward0>)
neg tensor(0.9724, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9267, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.4225, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<Mean

Training:  42%|█████████████████████████████████████████████████████████████████▍                                                                                        | 574/1352 [02:19<03:19,  3.90it/s]

neg tensor(0.9852, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9851, grad_fn=<MeanBackward0>)
pos tensor(0.9653, grad_fn=<MeanBackward0>)
neg tensor(0.9729, grad_fn=<MeanBackward0>)
pos tensor(0.9793, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.8189, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9697, grad_fn=<MeanBackward0>)
pos tensor(0.9675, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9905, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9968, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.8800, grad_fn=<MeanBackward0>)
pos tensor(0.9515, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<Mean

Training:  43%|█████████████████████████████████████████████████████████████████▍                                                                                        | 575/1352 [02:20<03:13,  4.02it/s]

neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9819, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<MeanBackward0>)
pos tensor(0.9495, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9845, grad_fn=<MeanBackward0>)
neg tensor(0.9378, grad_fn=<MeanBackward0>)
pos tensor(0.9856, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.8757, grad_fn=<MeanBackward0>)
pos tensor(0.9742, grad_fn=<MeanBackward0>)
neg tensor(0.9854, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9829, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<Mean

Training:  43%|█████████████████████████████████████████████████████████████████▌                                                                                        | 576/1352 [02:20<03:02,  4.25it/s]

neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9916, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9566, grad_fn=<MeanBackward0>)
pos tensor(0.9786, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9900, grad_fn=<MeanBackward0>)
neg tensor(0.9844, grad_fn=<MeanBackward0>)
pos tensor(0.9906, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9892, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.9611, grad_fn=<MeanBackward0>)
pos tensor(0.9813, grad_fn=<MeanBackward0>)
neg tensor(0.8976, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9511, grad_fn=<MeanBackward0>)
pos tensor(0.9466, grad_fn=<MeanBackward0>)
neg tensor(0.9904, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<Mean

Training:  43%|█████████████████████████████████████████████████████████████████▋                                                                                        | 577/1352 [02:20<03:06,  4.15it/s]

neg tensor(0.9377, grad_fn=<MeanBackward0>)
pos tensor(0.9843, grad_fn=<MeanBackward0>)
neg tensor(0.8026, grad_fn=<MeanBackward0>)
pos tensor(0.9716, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9735, grad_fn=<MeanBackward0>)
pos tensor(0.9501, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9585, grad_fn=<MeanBackward0>)
neg tensor(0.9931, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.8974, grad_fn=<MeanBackward0>)
pos tensor(0.9772, grad_fn=<MeanBackward0>)
neg tensor(0.9699, grad_fn=<MeanBackward0>)
pos tensor(0.9528, grad_fn=<MeanBackward0>)
neg tensor(0.9883, grad_fn=<Mean

Training:  43%|█████████████████████████████████████████████████████████████████▊                                                                                        | 578/1352 [02:20<03:06,  4.14it/s]

neg tensor(0.9641, grad_fn=<MeanBackward0>)
pos tensor(0.9844, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9818, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9805, grad_fn=<MeanBackward0>)
neg tensor(0.9901, grad_fn=<MeanBackward0>)
pos tensor(0.9811, grad_fn=<MeanBackward0>)
neg tensor(0.9752, grad_fn=<MeanBackward0>)
pos tensor(0.9672, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9681, grad_fn=<MeanBackward0>)
pos tensor(0.9296, grad_fn=<MeanBackward0>)
neg tensor(0.9874, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9749, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<Mean

Training:  43%|█████████████████████████████████████████████████████████████████▉                                                                                        | 579/1352 [02:21<03:20,  3.85it/s]

neg tensor(0.9654, grad_fn=<MeanBackward0>)
pos tensor(0.9667, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9785, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9739, grad_fn=<MeanBackward0>)
pos tensor(0.9750, grad_fn=<MeanBackward0>)
neg tensor(0.9827, grad_fn=<MeanBackward0>)
pos tensor(0.9808, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9800, grad_fn=<MeanBackward0>)
pos tensor(0.9794, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9854, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9891, grad_fn=<MeanBackward0>)
pos tensor(0.9777, grad_fn=<MeanBackward0>)
neg tensor(0.9910, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████                                                                                        | 580/1352 [02:21<03:14,  3.96it/s]

neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9112, grad_fn=<MeanBackward0>)
pos tensor(0.9886, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9779, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9822, grad_fn=<MeanBackward0>)
pos tensor(0.9868, grad_fn=<MeanBackward0>)
neg tensor(0.9875, grad_fn=<MeanBackward0>)
pos tensor(0.9865, grad_fn=<MeanBackward0>)
neg tensor(0.9517, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9671, grad_fn=<MeanBackward0>)
pos tensor(0.9892, grad_fn=<MeanBackward0>)
neg tensor(0.9958, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▏                                                                                       | 581/1352 [02:21<03:21,  3.83it/s]

neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9882, grad_fn=<MeanBackward0>)
neg tensor(0.9895, grad_fn=<MeanBackward0>)
pos tensor(0.9836, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9855, grad_fn=<MeanBackward0>)
neg tensor(0.9786, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.7911, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9839, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9836, grad_fn=<MeanBackward0>)
pos tensor(0.9702, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9879, grad_fn=<MeanBackward0>)
neg tensor(0.9561, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▎                                                                                       | 582/1352 [02:21<03:10,  4.05it/s]

neg tensor(0.9928, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9866, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9913, grad_fn=<MeanBackward0>)
pos tensor(0.9828, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9921, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9782, grad_fn=<MeanBackward0>)
pos tensor(0.9885, grad_fn=<MeanBackward0>)
neg tensor(0.9628, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▍                                                                                       | 583/1352 [02:22<03:23,  3.79it/s]

neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9842, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9838, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9903, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9805, grad_fn=<MeanBackward0>)
pos tensor(0.9698, grad_fn=<MeanBackward0>)
neg tensor(0.9431, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▌                                                                                       | 584/1352 [02:22<03:14,  3.95it/s]

neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9955, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9833, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9657, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9949, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9888, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<MeanBackward0>)
pos tensor(0.9743, grad_fn=<MeanBackward0>)
neg tensor(0.7711, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9928, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▋                                                                                       | 585/1352 [02:22<03:01,  4.22it/s]

neg tensor(0.9929, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9948, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9972, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9874, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9845, grad_fn=<MeanBackward0>)
pos tensor(0.9867, grad_fn=<MeanBackward0>)
neg tensor(0.9947, grad_fn=<MeanBackward0>)
pos tensor(0.9898, grad_fn=<MeanBackward0>)
neg tensor(0.9855, grad_fn=<MeanBackward0>)
pos tensor(0.9803, grad_fn=<MeanBackward0>)
neg tensor(0.9570, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9759, grad_fn=<MeanBackward0>)
pos tensor(0.9598, grad_fn=<MeanBackward0>)
neg tensor(0.9811, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9958, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▋                                                                                       | 586/1352 [02:22<03:23,  3.76it/s]

neg tensor(0.9971, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9711, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9946, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9918, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9966, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9829, grad_fn=<MeanBackward0>)
pos tensor(0.9748, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9887, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▊                                                                                       | 587/1352 [02:23<03:31,  3.63it/s]

neg tensor(0.9158, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9789, grad_fn=<MeanBackward0>)
neg tensor(0.9923, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9890, grad_fn=<MeanBackward0>)
neg tensor(0.9966, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9950, grad_fn=<MeanBackward0>)
pos tensor(0.9901, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9920, grad_fn=<MeanBackward0>)
pos tensor(0.9859, grad_fn=<MeanBackward0>)
neg tensor(0.9959, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9560, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<Mean

Training:  43%|██████████████████████████████████████████████████████████████████▉                                                                                       | 588/1352 [02:23<03:31,  3.60it/s]

neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9972, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9853, grad_fn=<MeanBackward0>)
pos tensor(0.9771, grad_fn=<MeanBackward0>)
neg tensor(0.9970, grad_fn=<MeanBackward0>)
pos tensor(0.9966, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9820, grad_fn=<MeanBackward0>)
pos tensor(0.9732, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9881, grad_fn=<MeanBackward0>)
neg tensor(0.9746, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9679, grad_fn=<Mean

Training:  44%|███████████████████████████████████████████████████████████████████                                                                                       | 589/1352 [02:23<03:23,  3.76it/s]

neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9962, grad_fn=<MeanBackward0>)
neg tensor(0.9972, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9944, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9841, grad_fn=<MeanBackward0>)
pos tensor(0.9965, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.8789, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9899, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<Mean

Training:  44%|███████████████████████████████████████████████████████████████████▏                                                                                      | 590/1352 [02:23<03:11,  3.98it/s]

neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9198, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9936, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9938, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9810, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9788, grad_fn=<MeanBackward0>)
pos tensor(0.9878, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.3263, grad_fn=<MeanBackward0>)
pos tensor(0.9052, grad_fn=<MeanBackward0>)
neg tensor(0.7797, grad_fn=<Mean

Training:  44%|███████████████████████████████████████████████████████████████████▎                                                                                      | 591/1352 [02:24<03:00,  4.21it/s]

neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9803, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9939, grad_fn=<MeanBackward0>)
pos tensor(0.9915, grad_fn=<MeanBackward0>)
neg tensor(0.9914, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9822, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.8274, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.7963, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9922, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBack

Training:  44%|███████████████████████████████████████████████████████████████████▍                                                                                      | 592/1352 [02:24<03:01,  4.18it/s]

neg tensor(0.9971, grad_fn=<MeanBackward0>)
pos tensor(0.9950, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9947, grad_fn=<MeanBackward0>)
neg tensor(0.7922, grad_fn=<MeanBackward0>)
pos tensor(0.9830, grad_fn=<MeanBackward0>)
neg tensor(0.9912, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9926, grad_fn=<MeanBackward0>)
pos tensor(0.9967, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9913, grad_fn=<MeanBackward0>)
neg tensor(0.9933, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9963, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.7962, grad_fn=<Mean

Training:  44%|███████████████████████████████████████████████████████████████████▌                                                                                      | 593/1352 [02:24<03:04,  4.12it/s]

neg tensor(-0.3445, grad_fn=<MeanBackward0>)
pos tensor(0.9688, grad_fn=<MeanBackward0>)
neg tensor(0.9916, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.6621, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9839, grad_fn=<MeanBackward0>)
pos tensor(0.9832, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9921, grad_fn=<MeanBackward0>)
neg tensor(0.9731, grad_fn=<MeanBackward0>)
pos tensor(0.9826, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9963, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9853, grad_fn=<MeanBackward0>)
neg tensor(0.9973, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9968, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9932, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<Mea

Training:  44%|███████████████████████████████████████████████████████████████████▋                                                                                      | 594/1352 [02:24<03:02,  4.14it/s]

neg tensor(0.9893, grad_fn=<MeanBackward0>)
pos tensor(0.9825, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9959, grad_fn=<MeanBackward0>)
neg tensor(0.9922, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9966, grad_fn=<MeanBackward0>)
pos tensor(0.9934, grad_fn=<MeanBackward0>)
neg tensor(0.9971, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9722, grad_fn=<MeanBackward0>)
pos tensor(0.9966, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9919, grad_fn=<MeanBackward0>)
neg tensor(0.9943, grad_fn=<MeanBackward0>)
pos tensor(0.9954, grad_fn=<MeanBackward0>)
neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.6867, grad_fn=<MeanBackward0>)
pos tensor(1., grad_fn=<MeanBackward0>)
neg tensor(0.9870, grad_fn=<MeanBack

Training:  44%|███████████████████████████████████████████████████████████████████▊                                                                                      | 595/1352 [02:25<03:01,  4.16it/s]

neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9929, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9966, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.6815, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9768, grad_fn=<MeanBackward0>)
pos tensor(0.9975, grad_fn=<MeanBackward0>)
neg tensor(0.9911, grad_fn=<MeanBackward0>)
pos tensor(0.9850, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9918, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9926, grad_fn=<MeanBackward0>)
neg tensor(0.9915, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<Mean

Training:  44%|███████████████████████████████████████████████████████████████████▉                                                                                      | 596/1352 [02:25<02:57,  4.26it/s]

neg tensor(0.8758, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.5624, grad_fn=<MeanBackward0>)
pos tensor(0.9864, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9412, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9848, grad_fn=<MeanBackward0>)
pos tensor(0.9861, grad_fn=<MeanBackward0>)
neg tensor(0.9972, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.9885, grad_fn=<MeanBackward0>)
pos tensor(0.9862, grad_fn=<MeanBackward0>)
neg tensor(0.9887, grad_fn=<MeanBackward0>)
pos tensor(0.9957, grad_fn=<MeanBackward0>)
neg tensor(0.9968, grad_fn=<MeanBackward0>)
pos tensor(0.9943, grad_fn=<MeanBackward0>)
neg tensor(0.9971, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<Mean

Training:  44%|████████████████████████████████████████████████████████████████████                                                                                      | 597/1352 [02:25<02:42,  4.64it/s]

neg tensor(0.9783, grad_fn=<MeanBackward0>)
pos tensor(0.9871, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9763, grad_fn=<MeanBackward0>)
pos tensor(0.9884, grad_fn=<MeanBackward0>)
neg tensor(0.9927, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.8051, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.7508, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9939, grad_fn=<MeanBackward0>)
neg tensor(0.9568, grad_fn=<MeanBackward0>)
pos tensor(0.9946, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<MeanBackward0>)
pos tensor(0.9974, grad_fn=<MeanBackward0>)
neg tensor(0.9908, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9831, grad_fn=<Mean

Training:  44%|████████████████████████████████████████████████████████████████████                                                                                      | 598/1352 [02:25<02:40,  4.69it/s]

pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9949, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9930, grad_fn=<MeanBackward0>)
pos tensor(0.9902, grad_fn=<MeanBackward0>)
neg tensor(0.9203, grad_fn=<MeanBackward0>)
pos tensor(0.9904, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)


Training:  44%|████████████████████████████████████████████████████████████████████▏                                                                                     | 599/1352 [02:25<02:53,  4.33it/s]

neg tensor(0.9965, grad_fn=<MeanBackward0>)
pos tensor(0.9945, grad_fn=<MeanBackward0>)
neg tensor(0.9964, grad_fn=<MeanBackward0>)
pos tensor(0.9925, grad_fn=<MeanBackward0>)
neg tensor(0.9951, grad_fn=<MeanBackward0>)
pos tensor(0.9917, grad_fn=<MeanBackward0>)
neg tensor(0.9880, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9934, grad_fn=<MeanBackward0>)
pos tensor(0.9857, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9869, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<MeanBackward0>)
pos tensor(0.9937, grad_fn=<MeanBackward0>)
neg tensor(0.9429, grad_fn=<MeanBackward0>)
pos tensor(0.9797, grad_fn=<MeanBackward0>)
neg tensor(0.9900, grad_fn=<MeanBackward0>)
pos tensor(0.9891, grad_fn=<MeanBackward0>)
neg tensor(0.9976, grad_fn=<MeanBackward0>)
pos tensor(0.9953, grad_fn=<MeanBackward0>)
neg tensor(0.9941, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9741, grad_fn=<Mean

Training:  44%|████████████████████████████████████████████████████████████████████▎                                                                                     | 600/1352 [02:26<02:56,  4.27it/s]

neg tensor(0.9646, grad_fn=<MeanBackward0>)
pos tensor(0.9981, grad_fn=<MeanBackward0>)
neg tensor(0.9705, grad_fn=<MeanBackward0>)
pos tensor(0.9775, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9897, grad_fn=<MeanBackward0>)
neg tensor(0.8875, grad_fn=<MeanBackward0>)
pos tensor(0.9960, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9914, grad_fn=<MeanBackward0>)
neg tensor(0.9721, grad_fn=<MeanBackward0>)
pos tensor(0.9530, grad_fn=<MeanBackward0>)
neg tensor(0.7410, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9821, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9976, grad_fn=<MeanBackward0>)
pos tensor(0.9952, grad_fn=<MeanBackward0>)
neg tensor(0.9935, grad_fn=<MeanBackward0>)
pos tensor(0.9888, grad_fn=<MeanBackward0>)
neg tensor(0.9925, grad_fn=<MeanBackward0>)
pos tensor(0.9932, grad_fn=<MeanBackward0>)
neg tensor(0.9967, grad_fn=<Mean

Training:  44%|████████████████████████████████████████████████████████████████████▍                                                                                     | 601/1352 [02:26<02:54,  4.30it/s]

neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9656, grad_fn=<MeanBackward0>)
pos tensor(0.9971, grad_fn=<MeanBackward0>)
neg tensor(0.9879, grad_fn=<MeanBackward0>)
pos tensor(0.9954, grad_fn=<MeanBackward0>)
neg tensor(0.9862, grad_fn=<MeanBackward0>)
pos tensor(0.9863, grad_fn=<MeanBackward0>)
neg tensor(0.9898, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9340, grad_fn=<MeanBackward0>)
pos tensor(0.9360, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9911, grad_fn=<MeanBackward0>)
neg tensor(0.9867, grad_fn=<MeanBackward0>)
pos tensor(0.9740, grad_fn=<MeanBackward0>)
neg tensor(0.9957, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9936, grad_fn=<MeanBackward0>)
neg tensor(0.9952, grad_fn=<MeanBackward0>)
pos tensor(0.9933, grad_fn=<MeanBackward0>)
neg tensor(0.9747, grad_fn=<Mean

Training:  45%|████████████████████████████████████████████████████████████████████▌                                                                                     | 602/1352 [02:26<03:02,  4.10it/s]

neg tensor(0.9909, grad_fn=<MeanBackward0>)
pos tensor(0.9851, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9923, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9957, grad_fn=<MeanBackward0>)
neg tensor(0.8819, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9832, grad_fn=<MeanBackward0>)
pos tensor(0.9657, grad_fn=<MeanBackward0>)
neg tensor(0.9942, grad_fn=<MeanBackward0>)
pos tensor(0.9908, grad_fn=<MeanBackward0>)
neg tensor(0.9473, grad_fn=<MeanBackward0>)
pos tensor(0.9711, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9944, grad_fn=<MeanBackward0>)
neg tensor(0.9860, grad_fn=<MeanBackward0>)
pos tensor(0.9710, grad_fn=<MeanBackward0>)
neg tensor(0.9955, grad_fn=<MeanBackward0>)
pos tensor(0.9931, grad_fn=<MeanBackward0>)
neg tensor(0.9961, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9953, grad_fn=<Mean

Training:  45%|████████████████████████████████████████████████████████████████████▋                                                                                     | 603/1352 [02:26<03:03,  4.08it/s]

neg tensor(0.2603, grad_fn=<MeanBackward0>)
pos tensor(0.9938, grad_fn=<MeanBackward0>)
neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9909, grad_fn=<MeanBackward0>)
neg tensor(0.9726, grad_fn=<MeanBackward0>)
pos tensor(0.9678, grad_fn=<MeanBackward0>)
neg tensor(0.8295, grad_fn=<MeanBackward0>)
pos tensor(0.9930, grad_fn=<MeanBackward0>)
neg tensor(0.9917, grad_fn=<MeanBackward0>)
pos tensor(0.9907, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9942, grad_fn=<MeanBackward0>)
neg tensor(0.9924, grad_fn=<MeanBackward0>)
pos tensor(0.9912, grad_fn=<MeanBackward0>)
neg tensor(0.8590, grad_fn=<MeanBackward0>)
pos tensor(0.9969, grad_fn=<MeanBackward0>)
neg tensor(0.8958, grad_fn=<MeanBackward0>)
pos tensor(0.9969, grad_fn=<MeanBackward0>)
neg tensor(0.9969, grad_fn=<MeanBackward0>)
pos tensor(0.9952, grad_fn=<MeanBackward0>)
neg tensor(0.9868, grad_fn=<MeanBackward0>)
pos tensor(0.9927, grad_fn=<MeanBackward0>)
neg tensor(0.9878, grad_fn=<Mean

Training:  45%|████████████████████████████████████████████████████████████████████▊                                                                                     | 604/1352 [02:27<02:57,  4.21it/s]

neg tensor(0.9940, grad_fn=<MeanBackward0>)
pos tensor(0.9910, grad_fn=<MeanBackward0>)
neg tensor(0.9789, grad_fn=<MeanBackward0>)
pos tensor(0.9709, grad_fn=<MeanBackward0>)
neg tensor(0.9859, grad_fn=<MeanBackward0>)
pos tensor(0.9817, grad_fn=<MeanBackward0>)
neg tensor(0.9882, grad_fn=<MeanBackward0>)
pos tensor(0.9941, grad_fn=<MeanBackward0>)
neg tensor(0.9954, grad_fn=<MeanBackward0>)
pos tensor(0.9951, grad_fn=<MeanBackward0>)
neg tensor(0.9873, grad_fn=<MeanBackward0>)
pos tensor(0.9873, grad_fn=<MeanBackward0>)
neg tensor(0.9364, grad_fn=<MeanBackward0>)
pos tensor(0.9958, grad_fn=<MeanBackward0>)
neg tensor(0.9889, grad_fn=<MeanBackward0>)
pos tensor(0.9899, grad_fn=<MeanBackward0>)
neg tensor(0.9700, grad_fn=<MeanBackward0>)
pos tensor(0.9940, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9739, grad_fn=<MeanBackward0>)
neg tensor(0.9830, grad_fn=<MeanBackward0>)
pos tensor(0.9948, grad_fn=<MeanBackward0>)
neg tensor(0.9765, grad_fn=<Mean

Training:  45%|████████████████████████████████████████████████████████████████████▉                                                                                     | 605/1352 [02:27<02:51,  4.36it/s]

neg tensor(0.9884, grad_fn=<MeanBackward0>)
pos tensor(0.9792, grad_fn=<MeanBackward0>)
neg tensor(0.9937, grad_fn=<MeanBackward0>)
pos tensor(0.9894, grad_fn=<MeanBackward0>)
neg tensor(0.9406, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9960, grad_fn=<MeanBackward0>)
pos tensor(0.9935, grad_fn=<MeanBackward0>)
neg tensor(0.9877, grad_fn=<MeanBackward0>)
pos tensor(0.9880, grad_fn=<MeanBackward0>)
neg tensor(0.9956, grad_fn=<MeanBackward0>)
pos tensor(0.9924, grad_fn=<MeanBackward0>)
neg tensor(0.9155, grad_fn=<MeanBackward0>)
pos tensor(1.0000, grad_fn=<MeanBackward0>)
neg tensor(0.9696, grad_fn=<MeanBackward0>)
pos tensor(0.9802, grad_fn=<MeanBackward0>)
neg tensor(0.9781, grad_fn=<MeanBackward0>)
pos tensor(0.9621, grad_fn=<MeanBackward0>)
neg tensor(0.9449, grad_fn=<MeanBackward0>)
pos tensor(0.9964, grad_fn=<MeanBackward0>)
neg tensor(0.9962, grad_fn=<MeanBackward0>)
pos tensor(0.9947, grad_fn=<MeanBackward0>)
neg tensor(0.9792, grad_fn=<Mean

Training:  45%|████████████████████████████████████████████████████████████████████▉                                                                                     | 605/1352 [02:27<03:02,  4.10it/s]


KeyboardInterrupt: 

In [115]:
# Sanity check: show the `assoc` attribute of the first sample in `data_train`.
# NOTE(review): presumably one association index per trackster — confirm against the dataset's `get`.
print(data_train[0].assoc)

[0, 1, 4, 4, 6, 1, 3, 5, 8, 3, 8, 9, 6, 9, 7, 7, 7, 2, 2, 7, 2, 2, 2, 2]


In [116]:
# Sanity check: show the `scores` attribute of the first sample in `data_train`.
# NOTE(review): looks like one row per node with 4 score columns — confirm where `scores` is built.
print(data_train[0].scores)

tensor([[1.1253e-02, 8.4718e-01, 9.9000e-01, 9.9333e-01],
        [1.1642e-05, 9.9926e-01, 9.9984e-01, 1.0000e+00],
        [1.2327e-01, 8.9402e-01, 9.6672e-01, 9.9460e-01],
        [8.1988e-05, 9.9914e-01, 9.9998e-01, 9.9973e-01],
        [8.5032e-04, 9.9523e-01, 9.8610e-01, 9.9714e-01],
        [1.9214e-02, 8.2967e-01, 9.9145e-01, 1.0000e+00],
        [6.9019e-03, 8.9194e-01, 9.8285e-01, 9.9922e-01],
        [1.1938e-03, 9.6392e-01, 9.9540e-01, 9.9636e-01],
        [8.6120e-03, 9.5292e-01, 9.3557e-01, 9.7343e-01],
        [2.3544e-01, 5.0414e-01, 9.0548e-01, 7.5158e-01],
        [3.5325e-01, 6.7075e-01, 5.9460e-01, 9.6007e-01],
        [7.9414e-03, 9.9043e-01, 9.6820e-01, 9.9665e-01],
        [2.2113e-01, 3.9131e-01, 8.6227e-01, 1.0000e+00],
        [2.4336e-01, 6.1869e-01, 8.0649e-01, 1.0000e+00],
        [1.6545e-04, 9.9834e-01, 9.9997e-01, 9.9731e-01],
        [0.0000e+00, 1.0000e+00, 1.0000e+00, 1.0000e+00],
        [4.9914e-03, 9.7373e-01, 1.0000e+00, 1.0000e+00],
        [0.000

In [117]:
# Sanity check: show the `links` attribute of the first sample in `data_train`.
# NOTE(review): looks like one row per node with 4 linked indices stored as floats — confirm where `links` is built.
print(data_train[0].links)

tensor([[0., 3., 8., 5.],
        [1., 9., 4., 0.],
        [4., 3., 6., 8.],
        [4., 7., 9., 6.],
        [6., 9., 5., 3.],
        [1., 9., 2., 0.],
        [3., 0., 8., 5.],
        [5., 8., 0., 6.],
        [8., 5., 0., 3.],
        [3., 8., 5., 0.],
        [8., 3., 0., 5.],
        [9., 6., 8., 5.],
        [6., 9., 5., 0.],
        [9., 1., 2., 0.],
        [7., 4., 2., 9.],
        [7., 0., 1., 2.],
        [7., 4., 0., 1.],
        [2., 0., 1., 3.],
        [2., 9., 7., 0.],
        [7., 0., 1., 2.],
        [2., 7., 0., 1.],
        [2., 0., 1., 3.],
        [2., 7., 9., 0.],
        [2., 7., 9., 0.]])
