In [1]:
!git clone https://github.com/rafikg/CEAL.git

Cloning into 'CEAL'...
remote: Enumerating objects: 395, done.[K
remote: Counting objects: 100% (53/53), done.[K
remote: Compressing objects: 100% (38/38), done.[K
remote: Total 395 (delta 11), reused 46 (delta 8), pack-reused 342[K
Receiving objects: 100% (395/395), 241.62 KiB | 2.12 MiB/s, done.
Resolving deltas: 100% (181/181), done.


In [2]:
from torch.utils.data import DataLoader
from torchvision import transforms
from torch.utils.data.sampler import SubsetRandomSampler
from typing import Optional, Callable, Union
from torch.utils.data import Dataset
import os
import glob
import cv2
import numpy as np
import torch
import logging


In [3]:
from typing import Tuple

def get_high_confidence_samples(pred_prob: np.ndarray,
                                delta: float) -> Tuple[np.ndarray, np.ndarray]:
    """
    Select high confidence samples from `D^U` whose entropy is smaller than
     the threshold
    `delta`.

    Parameters
    ----------
    pred_prob : np.ndarray
        prediction probability of x_i with dimension (batch x n_class)
    delta : float
        threshold

    Returns
    -------
    np.array with dimension (K x 1)  containing the indices of the K
        most informative samples.
    np.array with dimension (K x 1) containing the predicted classes of the
        k most informative samples
    """
    _, eni = entropy(pred_prob=pred_prob, k=len(pred_prob))
    hcs = eni[eni[:, 2] < delta]
    return hcs[:, 0].astype(np.int32), hcs[:, 1].astype(np.int32)


def get_uncertain_samples(pred_prob: np.ndarray, k: int,
                          criteria: str) -> Tuple[np.ndarray, np.ndarray]:
    """
    Get the K most informative samples based on the criteria
    Parameters
    ----------
    pred_prob : np.ndarray
        prediction probability of x_i with dimension (batch x n_class)
    k: int
    criteria: str
        `cl` : least_confidence()
        `ms` : margin_sampling()
        `en` : entropy

    Returns
    -------
    tuple(np.ndarray, np.ndarray)
    """
    if criteria == 'cl':
        uncertain_samples = least_confidence(pred_prob=pred_prob, k=k)
    elif criteria == 'ms':
        uncertain_samples = margin_sampling(pred_prob=pred_prob, k=k)
    elif criteria == 'en':
        uncertain_samples = entropy(pred_prob=pred_prob, k=k)
    else:
        raise ValueError('criteria {} not found !'.format(criteria))
    return uncertain_samples


In [4]:
# Authors rafik gouiaa <rafikgouiaaphd@gmail.com>, ...
from typing import Tuple
import numpy as np


def least_confidence(pred_prob: np.ndarray, k: int) -> Tuple[np.ndarray,
                                                             np.ndarray]:
    f"""
    Rank all the unlabeled samples in an ascending order according to
    equation 2

    Parameters
    ----------
    pred_prob : prediction probability of x_i with dimension (batch x n_class)
    k : int
        most informative samples
    Returns
    -------
    np.array with dimension (K x 1) containing the indices of the K
        most informative samples.
    np.array with dimension (K x 3) containing the indices, the predicted class
        and the `lc` of the k most informative samples
        column 1: indices
        column 2: predicted class.
        column 3: lc
    """
    assert np.round(pred_prob.sum(1).sum()) == pred_prob.shape[
        0], "pred_prob is not " \
            "a probability" \
            " distribution"
    assert 0 < k <= pred_prob.shape[0], "invalid k value k should be >0 &" \
                                        "k <=  pred_prob.shape[0"
    # Get max probabilities prediction and its corresponding classes
    most_pred_prob, most_pred_class = np.max(pred_prob, axis=1), np.argmax(
        pred_prob, axis=1)
    size = len(pred_prob)
    lc_i = np.column_stack(
        (list(range(size)), most_pred_class, most_pred_prob))
    # sort lc_i in ascending order
    lc_i = lc_i[lc_i[:, -1].argsort()]

    return lc_i[:k, 0].astype(np.int32), lc_i[:k]


def margin_sampling(pred_prob: np.ndarray, k: int) -> Tuple[np.ndarray,
                                                            np.ndarray]:
    f"""
    Rank all the unlabeled samples in an ascending order according to the
    equation 3
    ----------
    pred_prob : np.ndarray
        prediction probability of x_i with dimension (batch x n_class)
    k : int
        most informative samples

    Returns
    -------
    np.array with dimension (K x 1)  containing the indices of the K
        most informative samples.
    np.array with dimension (K x 3) containing the indices, the predicted class
        and the `ms_i` of the k most informative samples
        column 1: indices
        column 2: predicted class.
        column 3: margin sampling
    """
    assert np.round(pred_prob.sum(1).sum()) == pred_prob.shape[
        0], "pred_prob is not " \
            "a probability" \
            " distribution"
    assert 0 < k <= pred_prob.shape[0], "invalid k value k should be >0 &" \
                                        "k <=  pred_prob.shape[0"
    # Sort pred_prob to get j1 and j2
    size = len(pred_prob)
    margin = np.diff(np.abs(np.sort(pred_prob, axis=1)[:, ::-1][:, :2]))
    pred_class = np.argmax(pred_prob, axis=1)
    ms_i = np.column_stack((list(range(size)), pred_class, margin))

    # sort ms_i in ascending order according to margin
    ms_i = ms_i[ms_i[:, 2].argsort()]

    # the smaller the margin  means the classifier is more
    # uncertain about the sample
    return ms_i[:k, 0].astype(np.int32), ms_i[:k]


def entropy(pred_prob: np.ndarray, k: int) -> Tuple[np.ndarray, np.ndarray]:
    f"""
    Rank all the unlabeled samples in an descending order according to
    the equation 4

    Parameters
    ----------
    pred_prob : np.ndarray
        prediction probability of x_i with dimension (batch x n_class)
    k : int

    Returns
    -------
    np.array with dimension (K x 1)  containing the indices of the K
        most informative samples.
    np.array with dimension (K x 3) containing the indices, the predicted class
        and the `en_i` of the k most informative samples
        column 1: indices
        column 2: predicted class.
        column 3: entropy

    """
    # calculate the entropy for the pred_prob
    assert np.round(pred_prob.sum(1).sum()) == pred_prob.shape[
        0], "pred_prob is not " \
            "a probability" \
            " distribution"
    assert 0 < k <= pred_prob.shape[0], "invalid k value k should be >0 &" \
                                        "k <=  pred_prob.shape[0"
    size = len(pred_prob)
    entropy_ = - np.nansum(pred_prob * np.log(pred_prob), axis=1)
    pred_class = np.argmax(pred_prob, axis=1)
    en_i = np.column_stack((list(range(size)), pred_class, entropy_))

    # Sort en_i in descending order
    en_i = en_i[(-1 * en_i[:, 2]).argsort()]
    return en_i[:k, 0].astype(np.int32), en_i[:k]


In [5]:
# Authors: rafik gouiaa <rafikgouiaaphd@gmail.com>, ...

from typing import Optional, Callable

from torchvision.models import alexnet
from torch.utils.data import DataLoader
from torch.nn.functional import softmax
import numpy as np
import torch.nn as nn
import torch.optim as optim
import torch
import torch.optim as Optimizer
from tqdm import tqdm

class AlexNet(object):
    """
    Encapsulate the pretrained alexnet model
    Parameters
    ----------
    n_classes : int, default(10)
        the new number of classes
    device: Optional[str] 'cuda' or 'cpu', default(None)
            if None: cuda will be used if it is available
    """

    def __init__(self, n_classes: int = 10, device: Optional[str] = None):

        self.n_classes = n_classes
        self.model = alexnet(pretrained=True, progress=True)

        ## freeze_all_layers
        for param in self.model.parameters():
            param.requires_grad = False

        ## change last layer to accept n_classes instead of 1000 classes
        self.model.classifier[6] = nn.Linear(4096, self.n_classes)

        ## Add softmax layer to alexnet model
        self.model = nn.Sequential(self.model, nn.LogSoftmax(dim=1))

        if device is None:
            self.device = torch.device(
                "cuda:0" if torch.cuda.is_available() else "cpu")
        print('The code is running on {} '.format(self.device))

        # print(self.model)



    def __train_one_epoch(self, train_loader: DataLoader,
                          optimizer: Optimizer,
                          criterion: Callable,
                          valid_loader: DataLoader = None,
                          epoch: int = 0,
                          each_batch_idx: int = 300) -> None:
        """
        Train alexnet for one epoch
        Parameters
        ----------
        train_loader : DataLoader
        criterion :  Callable
        optimizer : Optimizer (torch.optim)
        epoch : int
        each_batch_idx : int
            print training stats after each_batch_idx

        Returns
        -------
        None
        """
        train_loss = 0
        data_size = 0
        print("Training ...")
        for batch_idx, sample_batched in tqdm(enumerate(train_loader)):
            # load data and label
            data, label = sample_batched['image'], sample_batched['label']

            # convert data and label to be compatible with the device
            data = data.to(self.device)
            data = data.float()
            label = label.to(self.device)

            # zero the parameter gradients
            optimizer.zero_grad()

            # run forward
            pred_prob = self.model(data)

            # calculate loss
            loss = criterion(pred_prob, label)

            # calculate gradient (backprop)
            loss.backward()

            # total train loss
            train_loss += loss.item()
            data_size += label.size(0)

            # update weights
            optimizer.step()

            if batch_idx % each_batch_idx == 0:
                print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                    epoch, batch_idx * len(data),
                    len(train_loader.sampler.indices),
                    100. * batch_idx / len(train_loader.sampler.indices),
                    loss.item()))
        if valid_loader:
            acc = self.evaluate(test_loader=valid_loader)
            print('Accuracy on the valid dataset {}'.format(acc))

        print('====> Epoch: {} Average loss: {:.4f}'.
              format(epoch,
                     train_loss / data_size))

    def train(self, epochs: int, train_loader: DataLoader,
              valid_loader: DataLoader = None) -> None:
        """
        Train alexnet for several epochs
        Parameters
        ----------
        epochs : int
            number of epochs
        train_loader:  DataLoader
            training set
        valid_loader : DataLoader, Optional

        Returns
        -------
        None
        """
        self.model.to(self.device)
        self.model.train()
        optimizer = optim.SGD(
            filter(lambda p: p.requires_grad, self.model.parameters()),
            lr=0.001, momentum=0.9)

        criterion = nn.CrossEntropyLoss()
        for epoch in range(epochs):
            self.__train_one_epoch(train_loader=train_loader,
                                   optimizer=optimizer,
                                   criterion=criterion,
                                   valid_loader=valid_loader,
                                   epoch=epoch
                                   )

    def evaluate(self, test_loader: DataLoader) -> float:
        """
        Calaculate alexnet accuracy on test data
        Parameters
        ----------
        test_loader: DataLoader

        Returns
        -------
        accuracy: float
        """
        correct = 0
        total = 0
        print("Evaluation ...")
        with torch.no_grad():
            for batch_idx, sample_batched in tqdm(enumerate(test_loader)):
                data, labels = sample_batched['image'], \
                               sample_batched['label']
                data = data.to(self.device)
                data = data.float()
                labels = labels.to(self.device)
                outputs = self.model(data)
                _, predicted = torch.max(outputs.data, 1)
                total += labels.size(0)
                correct += (predicted == labels).sum().item()
        return 100 * correct / total

    def predict(self, test_loader):
        """
        Run the inference pipeline on the test_loader data
        Parameters
        ----------
        test_loader: DataLoader
            test data

        Returns
        -------

        """
        self.model.eval()
        self.model.to(self.device)
        predict_results = np.empty(shape=(0, 10))
        print("Prediction on Unlabelled Data ...")
        with torch.no_grad():
            for batch_idx, sample_batched in tqdm(enumerate(test_loader)):
                data, _ = sample_batched['image'], \
                          sample_batched['label']
                data = data.to(self.device)
                data = data.float()
                outputs = self.model(data)
                outputs = softmax(outputs)
                predict_results = np.concatenate(
                    (predict_results, outputs.cpu().numpy()))
        return predict_results


## Dataset

In [6]:
pwd

'/content'

In [7]:
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [8]:
mkdir data

In [9]:
!git clone https://github.com/teavanist/MNIST-JPG.git

Cloning into 'MNIST-JPG'...
remote: Enumerating objects: 29, done.[K
remote: Counting objects: 100% (28/28), done.[K
remote: Compressing objects: 100% (19/19), done.[K
remote: Total 29 (delta 7), reused 27 (delta 7), pack-reused 1[K
Receiving objects: 100% (29/29), 17.53 MiB | 13.63 MiB/s, done.
Resolving deltas: 100% (7/7), done.


In [10]:
!unzip "/content/MNIST-JPG/MNIST Dataset JPG format.zip" -d /content/dataMnist

[1;30;43mStreaming output truncated to the last 5000 lines.[0m
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18241.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18251.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/1826.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18277.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18296.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/183.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18350.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18355.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18374.jpg  
 extracting: /content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training/9/18377.jpg 

In [11]:
!unzip "/content/data/train-images.idx3-ubyte" -d /content/data/train-images

unzip:  cannot find or open /content/data/train-images.idx3-ubyte, /content/data/train-images.idx3-ubyte.zip or /content/data/train-images.idx3-ubyte.ZIP.


In [None]:
# os.system("rm -rf /content/data/256_ObjectCategories/257.clutter")

0

In [None]:
# !pip install patool
# import patoolib




In [None]:
# patoolib.extract_archive("/content/drive/MyDrive/Data/project/mnist/MNIST_ORG.zip",outdir="/content/data")

In [12]:
%%writefile divide_data.sh

# This script is to divide the dataset into 80% 20%
echo "If you run this script on linux, change gshuf with shuf "
base_folder="/content/data/mnist_test_custom/"

mkdir -p "$base_folder"

for dir in "/content/data/trainingSet"*
do

  subdir=$(basename "$dir")

  mkdir -p "$base_folder$subdir"

  count=$(ls "$dir" | wc -l)

  tenpercent=$(expr $count '*' 20 '/' 100)

  ls "$dir" | shuf -n "$tenpercent" | xargs -I {} mv "$dir"/{} "$base_folder$subdir"

done


Writing divide_data.sh


## to split the data

In [13]:
!bash divide_data.sh

If you run this script on linux, change gshuf with shuf 
ls: cannot access '/content/data/trainingSet*': No such file or directory
ls: cannot access '/content/data/trainingSet*': No such file or directory


In [14]:

class mnistDataset(Dataset):
    """
    Encapsulate Caltech256 torch.utils.data.Dataset

    Parameters
    ----------
    root_dir : str
        Path to the dataset directory.

    transform : Callable,
        A transform function that takes the original image and
        return a transformed version.

    Attributes
    ----------
    data : list
        list of images files names
    labels : list
        list of integers (labels)
    """

    def __init__(self, root_dir,
                 transform: Optional[Callable] = None):

        self.root_dir = os.path.expanduser(root_dir)
        self.transform = transform
        self.data = []
        self.labels = []
        self._classes = 10

        # load data and labels
        for cat in range(0, self._classes):
            cat_dir = glob.glob(
                os.path.join(self.root_dir, str(cat)))[0]

            for img_file in glob.glob(os.path.join(cat_dir, '*.jpg')):
                self.data.append(img_file)
                self.labels.append(cat)

    def __getitem__(self, idx: int) -> dict:
        """
        Get the idx element

        Parameters
        ----------
        idx : int
           the index of the element


        Returns
        -------
        sample: dict[str, Any]
        """
        img, label = self.data[idx], self.labels[idx]
        label = torch.tensor(label,dtype = torch.long)
        img = cv2.imread(img)
        img = img[:, :, ::-1]
        img = self.img_normalize(img).transpose(2, 0, 1)
        sample = {'image': img, 'label': label}

        if self.transform:
            sample['image'] = self.transform(torch.tensor(sample['image']))

        return sample

    def __len__(self):

        return len(self.data)

    @staticmethod
    def img_normalize(img):
        img = (img / 255.0)

        return img

In [15]:
def update_threshold(delta: float, dr: float, t: int) -> float:
    """
    Update the selection threshold of high confidence samples
    Parameters
    ----------
    delta
    dr
    t

    Returns
    -------

    """
    if t > 0:
        delta = delta - dr * t
    return delta


In [16]:
import os
# len(os.listdir("/content/data/256_ObjectCategories"))

In [17]:
from torch.utils.data import DataLoader
from torchvision import transforms
from torch.utils.data.sampler import SubsetRandomSampler

import numpy as np
import torch

def ceal_learning_algorithm(du: DataLoader,
                            dl: DataLoader,
                            dtest: DataLoader,
                            k: int = 1000,
                            delta_0: float = 0.00005,
                            dr: float = 0.000033,
                            t: int = 1,
                            epochs: int = 15,
                            criteria: str = 'cl',
                            max_iter: int = 25):
    """
    Algorithm1 : Learning algorithm of CEAL.
    For simplicity, I used the same notation in the paper.
    Parameters
    ----------
    du: DataLoader
        Unlabeled samples
    dl : DataLoader
        labeled samples
    dtest : DataLoader
        test data
    k: int, (default = 1000)
        uncertain samples selection
    delta_0: float
        hight confidence samples selection threshold
    dr: float
        threshold decay
    t: int
        fine-tuning interval
    epochs: int
    criteria: str
    max_iter: int
        maximum iteration number.

    Returns
    -------

    """
    print('Initial configuration: len(du): {}, len(dl): {} '.format(
        len(du.sampler.indices),
        len(dl.sampler.indices)))

    # Create the model
    model = AlexNet(n_classes=10, device=None)

    # Initialize the model
    print('Intialize training the model on `dl` and test on `dtest`')

    model.train(epochs=epochs, train_loader=dl, valid_loader=None)

    # Evaluate model on dtest
    acc = model.evaluate(test_loader=dtest)

    print('====> Initial accuracy: {} '.format(acc))

    for iteration in range(max_iter):

        print('Iteration: {}: run prediction on unlabeled data '
                    '`du` '.format(iteration))

        pred_prob = model.predict(test_loader=du)

        # get k uncertain samples
        uncert_samp_idx, _ = get_uncertain_samples(pred_prob=pred_prob, k=k,
                                                   criteria=criteria)

        # get original indices
        uncert_samp_idx = [du.sampler.indices[idx] for idx in uncert_samp_idx]

        # add the uncertain samples selected from `du` to the labeled samples
        #  set `dl`
        dl.sampler.indices.extend(uncert_samp_idx)

        print(
            'Update size of `dl`  and `du` by adding uncertain {} samples'
            ' in `dl`'
            ' len(dl): {}, len(du) {}'.
            format(len(uncert_samp_idx), len(dl.sampler.indices),
                   len(du.sampler.indices)))

        # get high confidence samples `dh`
        hcs_idx, hcs_labels = get_high_confidence_samples(pred_prob=pred_prob,
                                                          delta=delta_0)
        # get the original indices
        hcs_idx = [du.sampler.indices[idx] for idx in hcs_idx]

        # remove the samples that already selected as uncertain samples.
        hcs_idx = [x for x in hcs_idx if
                   x not in list(set(uncert_samp_idx) & set(hcs_idx))]

        # add high confidence samples to the labeled set 'dl'

        # (1) update the indices
        dl.sampler.indices.extend(hcs_idx)
        # (2) update the original labels with the pseudo labels.
        for idx in range(len(hcs_idx)):
            dl.dataset.labels[hcs_idx[idx]] = hcs_labels[idx]
        print(
            'Update size of `dl`  and `du` by adding {} hcs samples in `dl`'
            ' len(dl): {}, len(du) {}'.
            format(len(hcs_idx), len(dl.sampler.indices),
                   len(du.sampler.indices)))

        if iteration % t == 0:
            print('Iteration: {} fine-tune the model on dh U dl'.
                        format(iteration))
            model.train(epochs=epochs, train_loader=dl)

            # update delta_0
            delta_0 = update_threshold(delta=delta_0, dr=dr, t=iteration)

        # remove the uncertain samples from the original `du`
        print('remove {} uncertain samples from du'.
                    format(len(uncert_samp_idx)))
        for val in uncert_samp_idx:
            du.sampler.indices.remove(val)

        acc = model.evaluate(test_loader=dtest)
        print(
            "Iteration: {}, len(dl): {}, len(du): {},"
            " len(dh) {}, acc: {} ".format(
                iteration, len(dl.sampler.indices),
                len(du.sampler.indices), len(hcs_idx), acc))


if __name__ == "__main__":

    dataset_train = mnistDataset(
        root_dir="/content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - training",
        transform=transforms.Compose([transforms.ToPILImage(),
        # transforms.RandomResizedCrop((224,224)),
        # transforms.RandomResizedCrop((64,64)),
        transforms.Resize((150,150)),
        # transforms.RandomHorizontalFlip(),
        transforms.ToTensor()]))

    dataset_test = mnistDataset(
        root_dir="/content/dataMnist/MNIST Dataset JPG format/MNIST - JPG - testing",
        transform=transforms.Compose([transforms.ToPILImage(),
        # transforms.RandomResizedCrop((224,224)),
        # transforms.RandomResizedCrop((64,64)),
        transforms.Resize((150,150)),
        # transforms.RandomHorizontalFlip(),
        transforms.ToTensor()]))

    # Creating data indices for training and validation splits:
    random_seed = 123
    validation_split = 0.1  # 10%
    shuffling_dataset = True
    batch_size = 16
    dataset_size = len(dataset_train)

    indices = list(range(dataset_size))
    split = int(np.floor(validation_split * dataset_size))

    if shuffling_dataset:
        np.random.seed(random_seed)
        np.random.shuffle(indices)
    train_indices, val_indices = indices[split:], indices[:split]

    # Creating PT data samplers and loaders:
    train_sampler = SubsetRandomSampler(train_indices)
    valid_sampler = SubsetRandomSampler(val_indices)

    du = torch.utils.data.DataLoader(dataset_train, batch_size=batch_size,
                                     sampler=train_sampler, num_workers=4)
    dl = torch.utils.data.DataLoader(dataset_train, batch_size=batch_size,
                                     sampler=valid_sampler, num_workers=4)
    dtest = torch.utils.data.DataLoader(dataset_test, batch_size=batch_size,
                                        num_workers=4)

    ceal_learning_algorithm(du=du, dl=dl, dtest=dtest)




Initial configuration: len(du): 54000, len(dl): 6000 


Downloading: "https://download.pytorch.org/models/alexnet-owt-7be5be79.pth" to /root/.cache/torch/hub/checkpoints/alexnet-owt-7be5be79.pth
100%|██████████| 233M/233M [00:01<00:00, 136MB/s]


The code is running on cuda:0 
Intialize training the model on `dl` and test on `dtest`
Training ...


9it [00:06,  1.88it/s]



308it [00:13, 46.59it/s]



375it [00:15, 24.76it/s]

====> Epoch: 0 Average loss: 0.0343
Training ...



5it [00:00, 20.98it/s]



313it [00:05, 62.49it/s]



375it [00:06, 55.55it/s]

====> Epoch: 1 Average loss: 0.0214
Training ...



0it [00:00, ?it/s]



307it [00:05, 37.28it/s]



375it [00:07, 50.85it/s]

====> Epoch: 2 Average loss: 0.0177
Training ...



4it [00:00, 19.92it/s]



313it [00:06, 63.90it/s]



375it [00:07, 47.92it/s]

====> Epoch: 3 Average loss: 0.0171
Training ...



11it [00:00, 54.89it/s]



308it [00:05, 59.90it/s]



375it [00:06, 57.63it/s]

====> Epoch: 4 Average loss: 0.0152
Training ...



5it [00:00, 20.07it/s]



309it [00:07, 59.20it/s]



375it [00:08, 41.74it/s]

====> Epoch: 5 Average loss: 0.0152
Training ...



8it [00:00, 41.05it/s]



309it [00:05, 63.56it/s]



375it [00:06, 59.50it/s]

====> Epoch: 6 Average loss: 0.0146
Training ...



9it [00:00, 42.13it/s]



307it [00:07, 37.75it/s]



375it [00:09, 39.44it/s]

====> Epoch: 7 Average loss: 0.0146
Training ...



8it [00:00, 37.09it/s]



313it [00:05, 60.52it/s]



375it [00:06, 59.13it/s]

====> Epoch: 8 Average loss: 0.0140
Training ...



8it [00:00, 39.92it/s]



306it [00:06, 33.93it/s]



375it [00:08, 44.99it/s]

====> Epoch: 9 Average loss: 0.0136
Training ...



5it [00:00, 21.36it/s]



309it [00:06, 59.04it/s]



375it [00:07, 52.06it/s]

====> Epoch: 10 Average loss: 0.0133
Training ...



10it [00:00, 44.02it/s]



304it [00:05, 44.86it/s]



375it [00:07, 52.70it/s]

====> Epoch: 11 Average loss: 0.0133
Training ...



5it [00:00, 21.44it/s]



309it [00:07, 62.92it/s]



375it [00:08, 45.06it/s]

====> Epoch: 12 Average loss: 0.0122
Training ...



7it [00:00, 35.77it/s]



312it [00:05, 59.74it/s]



375it [00:06, 59.29it/s]

====> Epoch: 13 Average loss: 0.0128
Training ...



7it [00:00, 31.70it/s]



305it [00:08, 45.57it/s]



375it [00:09, 40.04it/s]

====> Epoch: 14 Average loss: 0.0126
Evaluation ...



625it [00:11, 55.62it/s]

====> Initial accuracy: 91.9 
Iteration: 0: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



  outputs = softmax(outputs)
3375it [01:07, 49.88it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 7000, len(du) 54000
Update size of `dl`  and `du` by adding 1731 hcs samples in `dl` len(dl): 8731, len(du) 54000
Iteration: 0 fine-tune the model on dh U dl
Training ...


9it [00:00, 42.32it/s]



309it [00:08, 41.69it/s]



546it [00:12, 44.00it/s]

====> Epoch: 0 Average loss: 0.0958
Training ...



9it [00:00, 42.10it/s]



310it [00:05, 58.28it/s]



546it [00:11, 48.86it/s]

====> Epoch: 1 Average loss: 0.0803
Training ...



5it [00:00, 19.89it/s]



307it [00:06, 60.64it/s]



546it [00:10, 54.02it/s]

====> Epoch: 2 Average loss: 0.0771
Training ...



7it [00:00, 33.48it/s]



307it [00:07, 38.66it/s]



546it [00:12, 44.08it/s]

====> Epoch: 3 Average loss: 0.0775
Training ...



7it [00:00, 34.04it/s]



313it [00:05, 60.75it/s]



546it [00:10, 52.76it/s]

====> Epoch: 4 Average loss: 0.0774
Training ...



5it [00:00, 19.34it/s]



311it [00:07, 64.14it/s]



546it [00:10, 50.12it/s]

====> Epoch: 5 Average loss: 0.0777
Training ...



9it [00:00, 43.03it/s]



305it [00:06, 38.66it/s]



546it [00:12, 43.86it/s]

====> Epoch: 6 Average loss: 0.0758
Training ...



9it [00:00, 42.18it/s]



313it [00:05, 60.31it/s]



546it [00:09, 57.41it/s]

====> Epoch: 7 Average loss: 0.0766
Training ...



4it [00:00, 19.85it/s]



310it [00:07, 62.23it/s]



546it [00:11, 46.71it/s]

====> Epoch: 8 Average loss: 0.0765
Training ...



8it [00:00, 35.63it/s]



305it [00:05, 38.24it/s]



546it [00:12, 44.98it/s]

====> Epoch: 9 Average loss: 0.0749
Training ...



6it [00:00, 25.86it/s]



312it [00:05, 62.75it/s]



546it [00:09, 58.89it/s]

====> Epoch: 10 Average loss: 0.0740
Training ...



8it [00:00, 37.72it/s]



306it [00:08, 38.24it/s]



546it [00:12, 44.18it/s]

====> Epoch: 11 Average loss: 0.0757
Training ...



9it [00:00, 42.66it/s]



311it [00:05, 62.66it/s]



546it [00:11, 48.84it/s]


====> Epoch: 12 Average loss: 0.0755
Training ...


5it [00:00, 21.63it/s]



309it [00:06, 62.22it/s]



546it [00:09, 55.12it/s]

====> Epoch: 13 Average loss: 0.0768
Training ...



12it [00:00, 53.37it/s]



308it [00:06, 37.51it/s]



546it [00:12, 44.56it/s]


====> Epoch: 14 Average loss: 0.0744
remove 1000 uncertain samples from du
Evaluation ...


625it [00:12, 50.44it/s]

Iteration: 0, len(dl): 8731, len(du): 53000, len(dh) 1731, acc: 81.86 
Iteration: 1: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



3313it [01:05, 50.77it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 9731, len(du) 53000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 9731, len(du) 53000
Iteration: 1 fine-tune the model on dh U dl
Training ...


7it [00:00, 36.28it/s]



309it [00:07, 39.90it/s]



609it [00:13, 45.39it/s]

====> Epoch: 0 Average loss: 0.0710
Training ...



6it [00:00, 31.28it/s]



310it [00:05, 63.76it/s]



602it [00:12, 32.56it/s]



609it [00:12, 47.38it/s]

====> Epoch: 1 Average loss: 0.0696
Training ...



2it [00:00, 12.39it/s]



313it [00:05, 61.04it/s]



609it [00:10, 57.51it/s]

====> Epoch: 2 Average loss: 0.0711
Training ...



7it [00:00, 34.77it/s]



307it [00:08, 44.94it/s]



609it [00:13, 45.41it/s]

====> Epoch: 3 Average loss: 0.0690
Training ...



8it [00:00, 37.39it/s]



306it [00:05, 45.57it/s]



609it [00:13, 45.79it/s]

====> Epoch: 4 Average loss: 0.0715
Training ...



8it [00:00, 41.18it/s]



308it [00:05, 62.59it/s]



602it [00:10, 36.00it/s]



609it [00:10, 55.53it/s]

====> Epoch: 5 Average loss: 0.0714
Training ...



5it [00:00, 20.48it/s]



309it [00:07, 61.13it/s]



609it [00:12, 48.97it/s]

====> Epoch: 6 Average loss: 0.0699
Training ...



11it [00:00, 50.43it/s]



305it [00:06, 36.57it/s]



609it [00:13, 45.63it/s]

====> Epoch: 7 Average loss: 0.0690
Training ...



9it [00:00, 39.75it/s]



309it [00:05, 60.76it/s]



605it [00:11, 42.10it/s]



609it [00:12, 50.44it/s]

====> Epoch: 8 Average loss: 0.0702
Training ...



5it [00:00, 21.11it/s]



307it [00:06, 57.41it/s]



609it [00:11, 54.08it/s]

====> Epoch: 9 Average loss: 0.0688
Training ...



8it [00:00, 41.45it/s]



307it [00:07, 39.33it/s]



609it [00:13, 44.93it/s]

====> Epoch: 10 Average loss: 0.0720
Training ...



8it [00:00, 41.39it/s]



308it [00:05, 59.44it/s]



604it [00:12, 39.28it/s]



609it [00:12, 48.59it/s]

====> Epoch: 11 Average loss: 0.0707
Training ...



5it [00:00, 20.95it/s]



313it [00:05, 64.44it/s]



609it [00:10, 57.38it/s]

====> Epoch: 12 Average loss: 0.0717
Training ...



8it [00:00, 40.40it/s]



305it [00:08, 37.68it/s]



609it [00:13, 44.75it/s]

====> Epoch: 13 Average loss: 0.0683
Training ...



8it [00:00, 41.68it/s]



306it [00:05, 57.86it/s]



606it [00:13, 43.21it/s]



609it [00:13, 45.99it/s]


====> Epoch: 14 Average loss: 0.0700
remove 1000 uncertain samples from du
Evaluation ...


625it [00:11, 55.74it/s]

Iteration: 1, len(dl): 9731, len(du): 52000, len(dh) 0, acc: 84.49 
Iteration: 2: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



3250it [01:05, 49.65it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 10731, len(du) 52000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 10731, len(du) 52000
Iteration: 2 fine-tune the model on dh U dl
Training ...


8it [00:00, 36.34it/s]



305it [00:05, 34.73it/s]



610it [00:13, 60.75it/s]



671it [00:14, 47.49it/s]

====> Epoch: 0 Average loss: 0.0675
Training ...



11it [00:00, 52.81it/s]



312it [00:05, 59.68it/s]



604it [00:11, 36.25it/s]



671it [00:13, 49.04it/s]

====> Epoch: 1 Average loss: 0.0672
Training ...



5it [00:00, 21.26it/s]



308it [00:05, 63.27it/s]



608it [00:10, 59.39it/s]



671it [00:11, 56.22it/s]

====> Epoch: 2 Average loss: 0.0668
Training ...



5it [00:00, 23.33it/s]



308it [00:07, 49.97it/s]



612it [00:12, 58.55it/s]



671it [00:13, 48.02it/s]

====> Epoch: 3 Average loss: 0.0664
Training ...



9it [00:00, 44.10it/s]



304it [00:06, 35.14it/s]



611it [00:13, 59.11it/s]



671it [00:14, 46.74it/s]

====> Epoch: 4 Average loss: 0.0663
Training ...



9it [00:00, 46.80it/s]



311it [00:05, 61.29it/s]



608it [00:12, 35.84it/s]



671it [00:14, 46.52it/s]

====> Epoch: 5 Average loss: 0.0668
Training ...



6it [00:00, 31.81it/s]



307it [00:05, 58.46it/s]



606it [00:10, 42.73it/s]



671it [00:12, 54.17it/s]

====> Epoch: 6 Average loss: 0.0662
Training ...



4it [00:00, 19.29it/s]



307it [00:06, 59.16it/s]



610it [00:11, 60.07it/s]



671it [00:13, 50.88it/s]

====> Epoch: 7 Average loss: 0.0665
Training ...



8it [00:00, 38.27it/s]



306it [00:07, 36.30it/s]



611it [00:13, 62.00it/s]



671it [00:14, 46.59it/s]

====> Epoch: 8 Average loss: 0.0661
Training ...



9it [00:00, 44.99it/s]



305it [00:05, 45.75it/s]



613it [00:13, 54.06it/s]



671it [00:14, 45.90it/s]

====> Epoch: 9 Average loss: 0.0666
Training ...



9it [00:00, 43.98it/s]



311it [00:05, 62.24it/s]



605it [00:11, 35.88it/s]



671it [00:13, 50.30it/s]

====> Epoch: 10 Average loss: 0.0660
Training ...



5it [00:00, 19.99it/s]



307it [00:06, 62.84it/s]



607it [00:11, 60.37it/s]



671it [00:12, 55.20it/s]

====> Epoch: 11 Average loss: 0.0663
Training ...



5it [00:00, 22.45it/s]



306it [00:08, 46.51it/s]



607it [00:13, 58.64it/s]



671it [00:14, 45.62it/s]

====> Epoch: 12 Average loss: 0.0662
Training ...



7it [00:00, 36.66it/s]



305it [00:06, 41.72it/s]



610it [00:13, 59.93it/s]



671it [00:14, 47.27it/s]

====> Epoch: 13 Average loss: 0.0666
Training ...



11it [00:00, 54.68it/s]



307it [00:05, 47.67it/s]



608it [00:12, 41.51it/s]



671it [00:13, 48.46it/s]


====> Epoch: 14 Average loss: 0.0655
remove 1000 uncertain samples from du
Evaluation ...


625it [00:10, 59.90it/s]

Iteration: 2, len(dl): 10731, len(du): 51000, len(dh) 0, acc: 85.55 
Iteration: 3: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



3188it [01:04, 49.07it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 11731, len(du) 51000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 11731, len(du) 51000
Iteration: 3 fine-tune the model on dh U dl
Training ...



7it [00:00, 34.71it/s]



313it [00:05, 59.23it/s]



609it [00:12, 41.32it/s]



734it [00:15, 47.28it/s]

====> Epoch: 0 Average loss: 0.0638
Training ...



8it [00:00, 38.33it/s]



312it [00:05, 60.03it/s]



608it [00:10, 35.31it/s]



734it [00:14, 51.97it/s]

====> Epoch: 1 Average loss: 0.0635
Training ...



4it [00:00, 19.71it/s]



308it [00:06, 54.43it/s]



612it [00:11, 61.42it/s]



734it [00:13, 52.81it/s]

====> Epoch: 2 Average loss: 0.0639
Training ...



5it [00:00, 19.52it/s]



308it [00:07, 62.09it/s]



613it [00:12, 61.64it/s]



734it [00:14, 50.86it/s]

====> Epoch: 3 Average loss: 0.0621
Training ...



7it [00:00, 33.30it/s]



308it [00:07, 35.83it/s]



610it [00:13, 61.09it/s]



734it [00:15, 47.24it/s]

====> Epoch: 4 Average loss: 0.0640
Training ...



8it [00:00, 39.08it/s]



310it [00:06, 42.24it/s]



608it [00:13, 58.53it/s]



734it [00:15, 48.25it/s]

====> Epoch: 5 Average loss: 0.0637
Training ...



8it [00:00, 40.48it/s]



311it [00:05, 56.81it/s]



607it [00:12, 34.70it/s]



734it [00:15, 46.85it/s]

====> Epoch: 6 Average loss: 0.0637
Training ...



8it [00:00, 38.12it/s]



311it [00:05, 61.17it/s]



608it [00:10, 36.41it/s]



734it [00:14, 51.40it/s]


====> Epoch: 7 Average loss: 0.0632
Training ...


5it [00:00, 18.12it/s]



311it [00:06, 54.10it/s]



613it [00:11, 63.37it/s]



734it [00:13, 52.58it/s]

====> Epoch: 8 Average loss: 0.0639
Training ...



5it [00:00, 20.94it/s]



307it [00:07, 59.56it/s]



611it [00:12, 59.18it/s]



734it [00:14, 51.31it/s]

====> Epoch: 9 Average loss: 0.0634
Training ...



8it [00:00, 38.48it/s]



308it [00:08, 36.25it/s]



609it [00:13, 60.97it/s]



734it [00:15, 47.05it/s]

====> Epoch: 10 Average loss: 0.0640
Training ...



9it [00:00, 42.11it/s]



309it [00:06, 39.49it/s]



613it [00:13, 60.54it/s]



734it [00:15, 48.12it/s]

====> Epoch: 11 Average loss: 0.0627
Training ...



9it [00:00, 39.81it/s]



312it [00:05, 61.92it/s]



607it [00:12, 35.59it/s]



734it [00:15, 47.09it/s]

====> Epoch: 12 Average loss: 0.0641
Training ...



11it [00:00, 51.58it/s]



312it [00:05, 60.75it/s]



604it [00:11, 35.87it/s]



734it [00:14, 49.32it/s]

====> Epoch: 13 Average loss: 0.0621
Training ...



5it [00:00, 19.13it/s]



307it [00:05, 54.70it/s]



613it [00:11, 59.53it/s]



734it [00:14, 51.50it/s]


====> Epoch: 14 Average loss: 0.0634
remove 1000 uncertain samples from du
Evaluation ...


625it [00:11, 52.28it/s]

Iteration: 3, len(dl): 11731, len(du): 50000, len(dh) 0, acc: 89.38 
Iteration: 4: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



3125it [01:06, 47.05it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 12731, len(du) 50000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 12731, len(du) 50000
Iteration: 4 fine-tune the model on dh U dl
Training ...



7it [00:00, 35.87it/s]



308it [00:05, 60.31it/s]



606it [00:11, 33.89it/s]



796it [00:16, 47.00it/s]

====> Epoch: 0 Average loss: 0.0620
Training ...



7it [00:00, 34.68it/s]



313it [00:05, 61.94it/s]



605it [00:10, 34.79it/s]



796it [00:16, 48.78it/s]

====> Epoch: 1 Average loss: 0.0610
Training ...



5it [00:00, 19.32it/s]



310it [00:05, 59.54it/s]



608it [00:10, 59.30it/s]



796it [00:15, 49.88it/s]

====> Epoch: 2 Average loss: 0.0612
Training ...



5it [00:00, 17.80it/s]



313it [00:06, 58.35it/s]



607it [00:11, 58.00it/s]



796it [00:16, 49.36it/s]

====> Epoch: 3 Average loss: 0.0613
Training ...



5it [00:00, 22.42it/s]



313it [00:06, 59.74it/s]



607it [00:11, 59.47it/s]



796it [00:15, 49.86it/s]

====> Epoch: 4 Average loss: 0.0617
Training ...



5it [00:00, 18.17it/s]



306it [00:07, 61.15it/s]



610it [00:12, 61.20it/s]



796it [00:15, 50.00it/s]

====> Epoch: 5 Average loss: 0.0609
Training ...



5it [00:00, 19.27it/s]



313it [00:07, 60.41it/s]



614it [00:12, 64.05it/s]



796it [00:16, 49.57it/s]

====> Epoch: 6 Average loss: 0.0591
Training ...



8it [00:00, 38.43it/s]



308it [00:08, 43.40it/s]



612it [00:13, 58.40it/s]



796it [00:16, 48.00it/s]

====> Epoch: 7 Average loss: 0.0613
Training ...



8it [00:00, 41.11it/s]



309it [00:07, 43.31it/s]



607it [00:13, 58.75it/s]



796it [00:16, 48.36it/s]

====> Epoch: 8 Average loss: 0.0619
Training ...



9it [00:00, 40.10it/s]



307it [00:06, 35.51it/s]



609it [00:13, 61.51it/s]



796it [00:16, 47.95it/s]

====> Epoch: 9 Average loss: 0.0608
Training ...



9it [00:00, 42.62it/s]



307it [00:05, 57.49it/s]



608it [00:13, 38.23it/s]



796it [00:16, 48.36it/s]

====> Epoch: 10 Average loss: 0.0606
Training ...



8it [00:00, 40.43it/s]



313it [00:05, 59.02it/s]



604it [00:12, 38.01it/s]



796it [00:16, 48.07it/s]

====> Epoch: 11 Average loss: 0.0611
Training ...



7it [00:00, 35.29it/s]



304it [00:05, 60.21it/s]



607it [00:11, 38.23it/s]



796it [00:16, 47.62it/s]

====> Epoch: 12 Average loss: 0.0615
Training ...



8it [00:00, 40.65it/s]



307it [00:05, 58.28it/s]



607it [00:10, 50.11it/s]



796it [00:15, 51.06it/s]

====> Epoch: 13 Average loss: 0.0621
Training ...



5it [00:00, 18.30it/s]



311it [00:06, 58.85it/s]



607it [00:11, 58.70it/s]



796it [00:15, 50.96it/s]


====> Epoch: 14 Average loss: 0.0618
remove 1000 uncertain samples from du
Evaluation ...


625it [00:11, 53.48it/s]

Iteration: 4, len(dl): 12731, len(du): 49000, len(dh) 0, acc: 88.47 
Iteration: 5: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



3063it [01:03, 47.88it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 13731, len(du) 49000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 13731, len(du) 49000
Iteration: 5 fine-tune the model on dh U dl
Training ...



5it [00:00, 21.63it/s]



311it [00:05, 63.57it/s]



611it [00:10, 58.31it/s]



859it [00:17, 48.98it/s]

====> Epoch: 0 Average loss: 0.0570
Training ...



5it [00:00, 23.55it/s]



310it [00:05, 58.90it/s]



612it [00:10, 59.10it/s]



859it [00:17, 50.45it/s]

====> Epoch: 1 Average loss: 0.0594
Training ...



4it [00:00, 19.64it/s]



311it [00:05, 56.46it/s]



611it [00:11, 61.82it/s]



859it [00:17, 49.74it/s]

====> Epoch: 2 Average loss: 0.0588
Training ...



5it [00:00, 19.64it/s]



311it [00:06, 62.29it/s]



606it [00:10, 63.02it/s]



859it [00:16, 51.96it/s]

====> Epoch: 3 Average loss: 0.0597
Training ...



5it [00:00, 22.70it/s]



305it [00:06, 59.71it/s]



607it [00:11, 63.02it/s]



859it [00:17, 50.33it/s]

====> Epoch: 4 Average loss: 0.0585
Training ...



4it [00:00, 19.98it/s]



311it [00:06, 58.85it/s]



610it [00:11, 59.54it/s]



859it [00:17, 50.07it/s]

====> Epoch: 5 Average loss: 0.0577
Training ...



5it [00:00, 21.82it/s]



309it [00:06, 58.11it/s]



608it [00:11, 59.97it/s]



859it [00:17, 49.29it/s]

====> Epoch: 6 Average loss: 0.0587
Training ...



5it [00:00, 21.26it/s]



311it [00:06, 58.02it/s]



607it [00:11, 57.99it/s]



859it [00:17, 48.52it/s]

====> Epoch: 7 Average loss: 0.0591
Training ...



5it [00:00, 22.16it/s]



310it [00:06, 57.89it/s]



607it [00:11, 59.89it/s]



859it [00:17, 49.80it/s]

====> Epoch: 8 Average loss: 0.0590
Training ...



5it [00:00, 17.58it/s]



307it [00:06, 54.82it/s]



607it [00:11, 59.31it/s]



859it [00:17, 49.70it/s]

====> Epoch: 9 Average loss: 0.0591
Training ...



6it [00:00, 27.96it/s]



310it [00:06, 57.99it/s]



611it [00:11, 61.94it/s]



859it [00:17, 49.18it/s]

====> Epoch: 10 Average loss: 0.0597
Training ...



4it [00:00, 19.44it/s]



312it [00:06, 60.95it/s]



610it [00:11, 60.57it/s]



859it [00:17, 50.22it/s]

====> Epoch: 11 Average loss: 0.0582
Training ...



5it [00:00, 19.37it/s]



307it [00:06, 62.30it/s]



608it [00:11, 60.08it/s]



859it [00:17, 48.48it/s]

====> Epoch: 12 Average loss: 0.0589
Training ...



5it [00:00, 19.56it/s]



306it [00:06, 62.17it/s]



606it [00:11, 60.51it/s]



859it [00:17, 49.85it/s]

====> Epoch: 13 Average loss: 0.0596
Training ...



4it [00:00, 17.30it/s]



314it [00:06, 62.89it/s]



610it [00:11, 59.91it/s]



859it [00:17, 48.62it/s]


====> Epoch: 14 Average loss: 0.0591
remove 1000 uncertain samples from du
Evaluation ...


625it [00:11, 53.25it/s]

Iteration: 5, len(dl): 13731, len(du): 48000, len(dh) 0, acc: 84.49 
Iteration: 6: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



3000it [01:02, 48.26it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 14731, len(du) 48000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 14731, len(du) 48000
Iteration: 6 fine-tune the model on dh U dl
Training ...



6it [00:00, 23.91it/s]



307it [00:05, 58.19it/s]



611it [00:11, 59.74it/s]



907it [00:18, 39.76it/s]



921it [00:18, 48.57it/s]

====> Epoch: 0 Average loss: 0.0573
Training ...



5it [00:00, 22.01it/s]



309it [00:05, 60.62it/s]



609it [00:10, 57.39it/s]



906it [00:18, 40.58it/s]



921it [00:19, 48.38it/s]

====> Epoch: 1 Average loss: 0.0573
Training ...



8it [00:00, 39.66it/s]



309it [00:05, 62.50it/s]



607it [00:10, 38.36it/s]



910it [00:18, 44.80it/s]



921it [00:18, 49.28it/s]

====> Epoch: 2 Average loss: 0.0561
Training ...



8it [00:00, 38.06it/s]



308it [00:05, 62.01it/s]



607it [00:10, 34.46it/s]



913it [00:18, 52.34it/s]



921it [00:18, 48.84it/s]

====> Epoch: 3 Average loss: 0.0572
Training ...



10it [00:00, 53.36it/s]



308it [00:05, 59.66it/s]



609it [00:10, 41.73it/s]



908it [00:18, 52.40it/s]



921it [00:18, 49.62it/s]

====> Epoch: 4 Average loss: 0.0571
Training ...



9it [00:00, 44.82it/s]



311it [00:05, 54.70it/s]



605it [00:11, 34.00it/s]



907it [00:18, 56.04it/s]



921it [00:19, 48.03it/s]

====> Epoch: 5 Average loss: 0.0576
Training ...



10it [00:00, 43.71it/s]



309it [00:05, 59.71it/s]



605it [00:11, 36.98it/s]



909it [00:18, 58.30it/s]



921it [00:18, 48.54it/s]

====> Epoch: 6 Average loss: 0.0569
Training ...



9it [00:00, 41.38it/s]



309it [00:05, 60.33it/s]



605it [00:11, 35.64it/s]



907it [00:18, 59.41it/s]



921it [00:18, 49.47it/s]

====> Epoch: 7 Average loss: 0.0568
Training ...



9it [00:00, 42.50it/s]



310it [00:05, 56.29it/s]



605it [00:12, 37.89it/s]



907it [00:18, 58.63it/s]



921it [00:19, 48.43it/s]

====> Epoch: 8 Average loss: 0.0557
Training ...



7it [00:00, 35.33it/s]



312it [00:05, 60.67it/s]



607it [00:13, 34.35it/s]



908it [00:18, 62.33it/s]



921it [00:18, 48.49it/s]

====> Epoch: 9 Average loss: 0.0575
Training ...



7it [00:00, 35.04it/s]



305it [00:05, 44.54it/s]



609it [00:13, 41.73it/s]



906it [00:18, 66.23it/s]



921it [00:18, 49.15it/s]

====> Epoch: 10 Average loss: 0.0559
Training ...



10it [00:00, 46.50it/s]



305it [00:05, 39.95it/s]



609it [00:13, 50.46it/s]



908it [00:18, 61.75it/s]



921it [00:18, 48.66it/s]

====> Epoch: 11 Average loss: 0.0567
Training ...



9it [00:00, 44.20it/s]



306it [00:05, 38.17it/s]



612it [00:13, 57.54it/s]



911it [00:18, 60.27it/s]



921it [00:18, 49.08it/s]

====> Epoch: 12 Average loss: 0.0569
Training ...



9it [00:00, 41.21it/s]



306it [00:06, 38.37it/s]



611it [00:13, 60.94it/s]



911it [00:18, 59.20it/s]



921it [00:18, 48.60it/s]

====> Epoch: 13 Average loss: 0.0569
Training ...



8it [00:00, 41.47it/s]



306it [00:06, 41.40it/s]



609it [00:13, 58.23it/s]



910it [00:18, 59.80it/s]



921it [00:18, 48.94it/s]


====> Epoch: 14 Average loss: 0.0573
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 45.58it/s]

Iteration: 6, len(dl): 14731, len(du): 47000, len(dh) 0, acc: 88.3 
Iteration: 7: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2938it [01:00, 48.84it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 15731, len(du) 47000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 15731, len(du) 47000
Iteration: 7 fine-tune the model on dh U dl
Training ...



8it [00:00, 37.16it/s]



305it [00:07, 38.33it/s]



610it [00:13, 59.70it/s]



913it [00:18, 59.58it/s]



984it [00:20, 48.60it/s]

====> Epoch: 0 Average loss: 0.0556
Training ...



7it [00:00, 29.18it/s]



307it [00:08, 42.50it/s]



611it [00:13, 55.02it/s]



909it [00:19, 41.10it/s]



984it [00:21, 45.50it/s]

====> Epoch: 1 Average loss: 0.0560
Training ...



5it [00:00, 21.06it/s]



309it [00:07, 60.06it/s]



607it [00:12, 57.86it/s]



906it [00:19, 34.94it/s]



984it [00:21, 45.45it/s]

====> Epoch: 2 Average loss: 0.0561
Training ...



4it [00:00, 16.44it/s]



310it [00:05, 57.61it/s]



608it [00:11, 45.86it/s]



911it [00:19, 44.84it/s]



984it [00:20, 46.96it/s]

====> Epoch: 3 Average loss: 0.0557
Training ...



7it [00:00, 35.77it/s]



311it [00:05, 56.77it/s]



606it [00:12, 34.01it/s]



907it [00:19, 53.89it/s]



984it [00:20, 47.65it/s]

====> Epoch: 4 Average loss: 0.0560
Training ...



8it [00:00, 40.93it/s]



309it [00:05, 54.78it/s]



608it [00:13, 36.30it/s]



908it [00:19, 59.87it/s]



984it [00:20, 47.74it/s]

====> Epoch: 5 Average loss: 0.0559
Training ...



8it [00:00, 40.91it/s]



309it [00:06, 40.50it/s]



607it [00:13, 57.03it/s]



908it [00:19, 59.08it/s]



984it [00:20, 48.18it/s]

====> Epoch: 6 Average loss: 0.0566
Training ...



6it [00:00, 30.03it/s]



307it [00:07, 37.15it/s]



609it [00:14, 53.34it/s]



909it [00:19, 56.21it/s]



984it [00:20, 47.52it/s]

====> Epoch: 7 Average loss: 0.0557
Training ...



5it [00:00, 22.77it/s]



304it [00:08, 37.35it/s]



609it [00:13, 59.92it/s]



903it [00:19, 46.38it/s]



984it [00:21, 46.26it/s]

====> Epoch: 8 Average loss: 0.0559
Training ...



5it [00:00, 21.10it/s]



313it [00:07, 60.99it/s]



610it [00:12, 56.58it/s]



905it [00:18, 36.37it/s]



984it [00:20, 46.95it/s]

====> Epoch: 9 Average loss: 0.0551
Training ...



5it [00:00, 19.75it/s]



312it [00:06, 54.09it/s]



610it [00:11, 54.78it/s]



906it [00:19, 38.17it/s]



984it [00:21, 45.98it/s]

====> Epoch: 10 Average loss: 0.0556
Training ...



8it [00:00, 39.89it/s]



309it [00:05, 57.66it/s]



606it [00:11, 34.39it/s]



910it [00:18, 59.65it/s]



984it [00:20, 48.36it/s]

====> Epoch: 11 Average loss: 0.0552
Training ...



9it [00:00, 40.91it/s]



309it [00:05, 58.96it/s]



606it [00:12, 37.14it/s]



909it [00:19, 58.42it/s]



984it [00:20, 48.12it/s]

====> Epoch: 12 Average loss: 0.0557
Training ...



7it [00:00, 34.42it/s]



306it [00:05, 35.06it/s]



608it [00:13, 51.54it/s]



910it [00:18, 57.15it/s]



984it [00:20, 48.66it/s]

====> Epoch: 13 Average loss: 0.0546
Training ...



8it [00:00, 42.75it/s]



307it [00:07, 34.66it/s]



607it [00:13, 57.10it/s]



910it [00:19, 55.67it/s]



984it [00:20, 47.75it/s]


====> Epoch: 14 Average loss: 0.0556
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 44.83it/s]

Iteration: 7, len(dl): 15731, len(du): 46000, len(dh) 0, acc: 89.39 
Iteration: 8: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2875it [00:59, 48.31it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 16731, len(du) 46000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 16731, len(du) 46000
Iteration: 8 fine-tune the model on dh U dl
Training ...


6it [00:00, 30.57it/s]



307it [00:07, 36.22it/s]



607it [00:14, 57.06it/s]



908it [00:19, 58.66it/s]



1046it [00:22, 46.25it/s]

====> Epoch: 0 Average loss: 0.0537
Training ...



4it [00:00, 16.58it/s]



310it [00:08, 57.28it/s]



611it [00:13, 62.45it/s]



905it [00:20, 35.25it/s]



1046it [00:24, 43.54it/s]

====> Epoch: 1 Average loss: 0.0546
Training ...



5it [00:00, 19.69it/s]



309it [00:05, 55.55it/s]



604it [00:11, 39.68it/s]



906it [00:19, 53.01it/s]



1046it [00:22, 47.24it/s]

====> Epoch: 2 Average loss: 0.0542
Training ...



9it [00:00, 43.97it/s]



304it [00:05, 57.51it/s]



605it [00:12, 37.40it/s]



910it [00:18, 60.15it/s]



1046it [00:21, 49.49it/s]

====> Epoch: 3 Average loss: 0.0551
Training ...



8it [00:00, 40.54it/s]



308it [00:06, 41.34it/s]



605it [00:13, 54.35it/s]



911it [00:18, 57.12it/s]



1046it [00:21, 49.20it/s]

====> Epoch: 4 Average loss: 0.0534
Training ...



8it [00:00, 38.88it/s]



305it [00:07, 38.88it/s]



611it [00:13, 56.72it/s]



914it [00:18, 62.83it/s]



1046it [00:21, 47.94it/s]

====> Epoch: 5 Average loss: 0.0534
Training ...



5it [00:00, 20.29it/s]



309it [00:07, 56.57it/s]



608it [00:12, 55.87it/s]



908it [00:19, 35.08it/s]



1046it [00:23, 44.64it/s]

====> Epoch: 6 Average loss: 0.0541
Training ...



3it [00:00, 14.15it/s]



310it [00:06, 57.00it/s]



608it [00:11, 51.57it/s]



909it [00:19, 40.35it/s]



1046it [00:21, 47.73it/s]

====> Epoch: 7 Average loss: 0.0544
Training ...



7it [00:00, 36.66it/s]



308it [00:05, 55.74it/s]



605it [00:12, 36.21it/s]



907it [00:18, 57.61it/s]



1046it [00:21, 49.32it/s]

====> Epoch: 8 Average loss: 0.0543
Training ...



8it [00:00, 40.89it/s]



305it [00:05, 43.06it/s]



612it [00:13, 49.05it/s]



907it [00:18, 58.05it/s]



1046it [00:21, 49.34it/s]

====> Epoch: 9 Average loss: 0.0536
Training ...



8it [00:00, 36.44it/s]



308it [00:07, 39.05it/s]



610it [00:13, 59.06it/s]



908it [00:18, 61.23it/s]



1046it [00:21, 49.12it/s]

====> Epoch: 10 Average loss: 0.0539
Training ...



4it [00:00, 17.70it/s]



308it [00:08, 50.80it/s]



612it [00:13, 55.51it/s]



906it [00:18, 40.20it/s]



1046it [00:22, 46.51it/s]

====> Epoch: 11 Average loss: 0.0542
Training ...



2it [00:00,  9.40it/s]



312it [00:06, 60.53it/s]



607it [00:11, 55.25it/s]



905it [00:18, 36.01it/s]



1046it [00:22, 46.46it/s]

====> Epoch: 12 Average loss: 0.0553
Training ...



9it [00:00, 43.68it/s]



310it [00:05, 61.40it/s]



605it [00:10, 33.27it/s]



912it [00:18, 59.18it/s]



1046it [00:21, 49.50it/s]

====> Epoch: 13 Average loss: 0.0542
Training ...



6it [00:00, 33.05it/s]



308it [00:05, 57.76it/s]



607it [00:12, 41.20it/s]



910it [00:18, 56.52it/s]



1046it [00:21, 48.77it/s]


====> Epoch: 14 Average loss: 0.0534
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 44.80it/s]

Iteration: 8, len(dl): 16731, len(du): 45000, len(dh) 0, acc: 89.74 
Iteration: 9: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2813it [00:58, 47.85it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 17731, len(du) 45000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 17731, len(du) 45000
Iteration: 9 fine-tune the model on dh U dl
Training ...



7it [00:00, 34.63it/s]



312it [00:05, 55.75it/s]



607it [00:13, 33.37it/s]



909it [00:19, 56.75it/s]



1109it [00:23, 47.70it/s]

====> Epoch: 0 Average loss: 0.0531
Training ...



9it [00:00, 40.37it/s]



306it [00:07, 37.02it/s]



610it [00:14, 57.29it/s]



908it [00:19, 55.29it/s]



1109it [00:23, 46.34it/s]

====> Epoch: 1 Average loss: 0.0537
Training ...



4it [00:00, 13.62it/s]



309it [00:07, 53.52it/s]



609it [00:13, 57.73it/s]



907it [00:19, 39.31it/s]



1109it [00:25, 43.68it/s]


====> Epoch: 2 Average loss: 0.0534
Training ...


7it [00:00, 33.58it/s]



306it [00:05, 55.62it/s]



607it [00:11, 35.38it/s]



909it [00:19, 46.40it/s]



1109it [00:23, 48.02it/s]

====> Epoch: 3 Average loss: 0.0531
Training ...



7it [00:00, 34.62it/s]



307it [00:05, 47.79it/s]



611it [00:13, 43.90it/s]



907it [00:19, 60.31it/s]



1109it [00:22, 49.04it/s]

====> Epoch: 4 Average loss: 0.0537
Training ...



6it [00:00, 31.09it/s]



306it [00:08, 34.62it/s]



609it [00:13, 61.05it/s]



907it [00:19, 56.89it/s]



1109it [00:24, 46.00it/s]

====> Epoch: 5 Average loss: 0.0543
Training ...



7it [00:00, 32.05it/s]



314it [00:06, 61.02it/s]



612it [00:11, 59.59it/s]



907it [00:19, 37.11it/s]



1109it [00:23, 46.85it/s]

====> Epoch: 6 Average loss: 0.0531
Training ...



9it [00:00, 40.29it/s]



307it [00:05, 55.54it/s]



608it [00:12, 42.08it/s]



909it [00:18, 58.72it/s]



1109it [00:22, 49.54it/s]

====> Epoch: 7 Average loss: 0.0533
Training ...



9it [00:00, 43.07it/s]



308it [00:05, 37.95it/s]



610it [00:13, 51.49it/s]



909it [00:18, 58.13it/s]



1109it [00:22, 49.44it/s]

====> Epoch: 8 Average loss: 0.0529
Training ...



7it [00:00, 35.26it/s]



306it [00:08, 35.16it/s]



606it [00:14, 53.30it/s]



911it [00:19, 54.38it/s]



1109it [00:25, 44.32it/s]

====> Epoch: 9 Average loss: 0.0535
Training ...



5it [00:00, 20.21it/s]



309it [00:06, 56.16it/s]



614it [00:12, 61.37it/s]



904it [00:19, 32.23it/s]



1109it [00:23, 46.36it/s]

====> Epoch: 10 Average loss: 0.0536
Training ...



7it [00:00, 35.06it/s]



311it [00:05, 61.10it/s]



605it [00:12, 33.98it/s]



908it [00:18, 56.04it/s]



1109it [00:21, 50.61it/s]

====> Epoch: 11 Average loss: 0.0529
Training ...



8it [00:00, 37.25it/s]



308it [00:07, 34.55it/s]



609it [00:13, 54.95it/s]



908it [00:18, 59.00it/s]



1109it [00:23, 47.52it/s]


====> Epoch: 12 Average loss: 0.0540
Training ...


5it [00:00, 21.66it/s]



311it [00:06, 59.62it/s]



612it [00:11, 56.37it/s]



906it [00:18, 36.19it/s]



1109it [00:22, 48.89it/s]

====> Epoch: 13 Average loss: 0.0522
Training ...



7it [00:00, 34.20it/s]



307it [00:05, 55.13it/s]



606it [00:12, 38.34it/s]



908it [00:18, 54.78it/s]



1109it [00:21, 50.76it/s]


====> Epoch: 14 Average loss: 0.0532
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 47.30it/s]

Iteration: 9, len(dl): 17731, len(du): 44000, len(dh) 0, acc: 84.33 
Iteration: 10: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2750it [00:56, 48.74it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 18731, len(du) 44000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 18731, len(du) 44000
Iteration: 10 fine-tune the model on dh U dl
Training ...



9it [00:00, 42.33it/s]



307it [00:07, 49.90it/s]



611it [00:13, 61.66it/s]



904it [00:18, 36.78it/s]



1171it [00:25, 45.90it/s]

====> Epoch: 0 Average loss: 0.0521
Training ...



6it [00:00, 29.27it/s]



312it [00:05, 60.75it/s]



605it [00:11, 38.72it/s]



910it [00:18, 60.57it/s]



1171it [00:23, 50.89it/s]

====> Epoch: 1 Average loss: 0.0512
Training ...



7it [00:00, 36.34it/s]



307it [00:06, 37.55it/s]



609it [00:13, 58.79it/s]



908it [00:18, 60.53it/s]



1171it [00:24, 47.27it/s]

====> Epoch: 2 Average loss: 0.0516
Training ...



4it [00:00, 15.44it/s]



306it [00:06, 53.42it/s]



609it [00:11, 58.70it/s]



907it [00:18, 52.39it/s]



1171it [00:23, 49.63it/s]

====> Epoch: 3 Average loss: 0.0508
Training ...



7it [00:00, 32.80it/s]



308it [00:06, 41.83it/s]



611it [00:13, 56.87it/s]



911it [00:18, 56.38it/s]



1171it [00:24, 48.41it/s]

====> Epoch: 4 Average loss: 0.0520
Training ...



4it [00:00, 17.78it/s]



309it [00:07, 54.00it/s]



609it [00:12, 56.88it/s]



905it [00:19, 35.74it/s]



1171it [00:24, 47.10it/s]

====> Epoch: 5 Average loss: 0.0518
Training ...



7it [00:00, 35.31it/s]



308it [00:05, 58.34it/s]



609it [00:13, 39.92it/s]



911it [00:18, 60.06it/s]



1171it [00:23, 50.71it/s]

====> Epoch: 6 Average loss: 0.0517
Training ...



4it [00:00, 20.06it/s]



307it [00:08, 57.91it/s]



607it [00:13, 55.37it/s]



909it [00:18, 40.08it/s]



1171it [00:25, 45.59it/s]

====> Epoch: 7 Average loss: 0.0516
Training ...



9it [00:00, 44.75it/s]



311it [00:05, 58.31it/s]



607it [00:11, 35.83it/s]



907it [00:18, 59.24it/s]



1171it [00:23, 50.62it/s]

====> Epoch: 8 Average loss: 0.0514
Training ...



6it [00:00, 28.87it/s]



306it [00:07, 35.69it/s]



607it [00:13, 55.02it/s]



910it [00:18, 57.96it/s]



1171it [00:25, 46.20it/s]

====> Epoch: 9 Average loss: 0.0513
Training ...



2it [00:00, 10.48it/s]



307it [00:05, 55.66it/s]



607it [00:11, 49.23it/s]



912it [00:19, 54.98it/s]



1171it [00:24, 48.77it/s]

====> Epoch: 10 Average loss: 0.0520
Training ...



9it [00:00, 38.36it/s]



306it [00:06, 35.15it/s]



611it [00:13, 54.37it/s]



909it [00:18, 56.74it/s]



1171it [00:24, 47.61it/s]

====> Epoch: 11 Average loss: 0.0520
Training ...



4it [00:00, 16.79it/s]



312it [00:06, 57.36it/s]



608it [00:11, 50.84it/s]



909it [00:19, 38.09it/s]



1171it [00:24, 48.41it/s]

====> Epoch: 12 Average loss: 0.0505
Training ...



7it [00:00, 37.14it/s]



310it [00:05, 62.58it/s]



608it [00:13, 52.51it/s]



907it [00:18, 56.82it/s]



1171it [00:23, 50.17it/s]

====> Epoch: 13 Average loss: 0.0518
Training ...



4it [00:00, 16.03it/s]



311it [00:07, 58.92it/s]



608it [00:12, 58.06it/s]



908it [00:19, 41.21it/s]



1171it [00:25, 46.73it/s]


====> Epoch: 14 Average loss: 0.0512
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 46.45it/s]

Iteration: 10, len(dl): 18731, len(du): 43000, len(dh) 0, acc: 87.91 
Iteration: 11: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2688it [00:55, 48.75it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 19731, len(du) 43000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 19731, len(du) 43000
Iteration: 11 fine-tune the model on dh U dl
Training ...


7it [00:00, 35.81it/s]



308it [00:05, 61.90it/s]



606it [00:12, 36.43it/s]



910it [00:18, 57.18it/s]



1210it [00:24, 56.86it/s]



1234it [00:24, 49.81it/s]

====> Epoch: 0 Average loss: 0.0504
Training ...



3it [00:00, 14.77it/s]



309it [00:07, 57.32it/s]



611it [00:12, 59.65it/s]



911it [00:19, 42.73it/s]



1210it [00:25, 49.69it/s]



1234it [00:26, 47.09it/s]

====> Epoch: 1 Average loss: 0.0509
Training ...



6it [00:00, 31.23it/s]



310it [00:05, 53.98it/s]



605it [00:12, 36.93it/s]



911it [00:18, 60.96it/s]



1207it [00:23, 57.34it/s]



1234it [00:24, 51.04it/s]

====> Epoch: 2 Average loss: 0.0507
Training ...



4it [00:00, 19.13it/s]



311it [00:07, 56.17it/s]



607it [00:12, 58.88it/s]



907it [00:18, 37.42it/s]



1207it [00:25, 56.89it/s]



1234it [00:25, 47.58it/s]

====> Epoch: 3 Average loss: 0.0512
Training ...



9it [00:00, 40.88it/s]



312it [00:05, 56.65it/s]



607it [00:12, 43.58it/s]



911it [00:18, 57.86it/s]



1209it [00:23, 58.08it/s]



1234it [00:24, 50.95it/s]

====> Epoch: 4 Average loss: 0.0497
Training ...



5it [00:00, 20.87it/s]



313it [00:07, 58.78it/s]



613it [00:12, 58.49it/s]



906it [00:19, 38.84it/s]



1212it [00:25, 57.89it/s]



1234it [00:26, 46.91it/s]

====> Epoch: 5 Average loss: 0.0508
Training ...



9it [00:00, 42.30it/s]



310it [00:05, 55.38it/s]



606it [00:13, 37.11it/s]



908it [00:18, 54.56it/s]



1207it [00:24, 38.92it/s]



1234it [00:24, 49.41it/s]

====> Epoch: 6 Average loss: 0.0509
Training ...



4it [00:00, 17.14it/s]



311it [00:07, 58.17it/s]



612it [00:12, 56.56it/s]



907it [00:19, 34.09it/s]



1213it [00:25, 59.69it/s]



1234it [00:26, 47.28it/s]

====> Epoch: 7 Average loss: 0.0501
Training ...



7it [00:00, 34.13it/s]



305it [00:06, 36.56it/s]



610it [00:13, 52.00it/s]



909it [00:19, 48.77it/s]



1207it [00:27, 34.15it/s]



1234it [00:28, 43.25it/s]

====> Epoch: 8 Average loss: 0.0495
Training ...



5it [00:00, 21.02it/s]



311it [00:05, 55.51it/s]



606it [00:10, 56.28it/s]



911it [00:18, 54.01it/s]



1212it [00:23, 55.99it/s]



1234it [00:24, 51.06it/s]

====> Epoch: 9 Average loss: 0.0502
Training ...



8it [00:00, 39.43it/s]



305it [00:06, 37.92it/s]



610it [00:13, 57.26it/s]



912it [00:18, 57.46it/s]



1205it [00:25, 39.32it/s]



1234it [00:25, 47.53it/s]

====> Epoch: 10 Average loss: 0.0510
Training ...



4it [00:00, 19.73it/s]



306it [00:05, 58.62it/s]



610it [00:11, 53.37it/s]



908it [00:18, 54.33it/s]



1210it [00:23, 57.93it/s]



1234it [00:24, 50.53it/s]

====> Epoch: 11 Average loss: 0.0501
Training ...



9it [00:00, 44.68it/s]



307it [00:06, 39.62it/s]



605it [00:12, 62.59it/s]



911it [00:18, 59.69it/s]



1208it [00:25, 36.63it/s]



1234it [00:25, 47.70it/s]

====> Epoch: 12 Average loss: 0.0514
Training ...



4it [00:00, 18.27it/s]



312it [00:06, 57.21it/s]



606it [00:11, 60.10it/s]



912it [00:18, 51.54it/s]



1208it [00:24, 58.83it/s]



1234it [00:24, 49.94it/s]

====> Epoch: 13 Average loss: 0.0508
Training ...



7it [00:00, 34.44it/s]



305it [00:06, 34.42it/s]



610it [00:13, 58.99it/s]



907it [00:18, 58.00it/s]



1204it [00:25, 38.88it/s]



1234it [00:25, 47.54it/s]


====> Epoch: 14 Average loss: 0.0502
remove 1000 uncertain samples from du
Evaluation ...


625it [00:11, 54.69it/s]

Iteration: 11, len(dl): 19731, len(du): 42000, len(dh) 0, acc: 84.4 
Iteration: 12: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2625it [00:54, 48.34it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 20731, len(du) 42000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 20731, len(du) 42000
Iteration: 12 fine-tune the model on dh U dl
Training ...



5it [00:00, 19.48it/s]



313it [00:06, 60.11it/s]



612it [00:11, 56.35it/s]



911it [00:19, 45.45it/s]



1210it [00:24, 55.93it/s]



1296it [00:25, 50.12it/s]

====> Epoch: 0 Average loss: 0.0494
Training ...



7it [00:00, 33.40it/s]



305it [00:06, 37.74it/s]



611it [00:13, 58.93it/s]



910it [00:18, 56.57it/s]



1205it [00:25, 36.30it/s]



1296it [00:27, 46.72it/s]

====> Epoch: 1 Average loss: 0.0500
Training ...



9it [00:00, 44.48it/s]



307it [00:05, 61.77it/s]



606it [00:11, 36.77it/s]



910it [00:18, 60.24it/s]



1210it [00:23, 58.03it/s]



1296it [00:24, 52.39it/s]

====> Epoch: 2 Average loss: 0.0506
Training ...



8it [00:00, 43.96it/s]



310it [00:07, 46.14it/s]



610it [00:13, 57.63it/s]



912it [00:18, 56.73it/s]



1209it [00:26, 53.71it/s]



1296it [00:27, 46.73it/s]

====> Epoch: 3 Average loss: 0.0495
Training ...



7it [00:00, 34.37it/s]



310it [00:05, 59.60it/s]



606it [00:11, 42.50it/s]



911it [00:18, 56.15it/s]



1213it [00:23, 61.82it/s]



1296it [00:25, 51.41it/s]

====> Epoch: 4 Average loss: 0.0494
Training ...



4it [00:00, 19.25it/s]



308it [00:07, 58.30it/s]



607it [00:13, 56.40it/s]



907it [00:20, 35.15it/s]



1207it [00:26, 55.09it/s]



1296it [00:28, 46.01it/s]


====> Epoch: 5 Average loss: 0.0493
Training ...


9it [00:00, 41.62it/s]



305it [00:06, 35.10it/s]



608it [00:13, 55.93it/s]



910it [00:18, 59.06it/s]



1204it [00:25, 40.31it/s]



1296it [00:27, 46.89it/s]

====> Epoch: 6 Average loss: 0.0499
Training ...



5it [00:00, 23.13it/s]



308it [00:05, 57.97it/s]



610it [00:10, 53.19it/s]



906it [00:18, 52.73it/s]



1214it [00:23, 60.56it/s]



1296it [00:25, 50.92it/s]

====> Epoch: 7 Average loss: 0.0492
Training ...



7it [00:00, 34.11it/s]



307it [00:07, 32.84it/s]



611it [00:13, 57.86it/s]



910it [00:18, 54.87it/s]



1206it [00:25, 41.35it/s]



1296it [00:27, 47.09it/s]

====> Epoch: 8 Average loss: 0.0501
Training ...



6it [00:00, 29.48it/s]



313it [00:05, 60.18it/s]



605it [00:11, 33.24it/s]



911it [00:18, 58.99it/s]



1210it [00:23, 59.39it/s]



1296it [00:25, 51.21it/s]

====> Epoch: 9 Average loss: 0.0492
Training ...



6it [00:00, 29.06it/s]



312it [00:08, 56.34it/s]



611it [00:13, 59.46it/s]



905it [00:19, 39.05it/s]



1203it [00:26, 51.09it/s]



1296it [00:28, 45.10it/s]

====> Epoch: 10 Average loss: 0.0492
Training ...



7it [00:00, 36.29it/s]



311it [00:05, 54.00it/s]



608it [00:13, 38.22it/s]



907it [00:18, 58.77it/s]



1206it [00:23, 52.70it/s]



1296it [00:26, 48.98it/s]

====> Epoch: 11 Average loss: 0.0485
Training ...



5it [00:00, 24.63it/s]



308it [00:06, 56.68it/s]



612it [00:12, 58.95it/s]



906it [00:19, 42.07it/s]



1208it [00:24, 60.24it/s]



1296it [00:26, 49.63it/s]

====> Epoch: 12 Average loss: 0.0486
Training ...



8it [00:00, 39.95it/s]



307it [00:06, 38.53it/s]



613it [00:13, 58.01it/s]



911it [00:18, 58.34it/s]



1207it [00:25, 38.32it/s]



1296it [00:27, 47.15it/s]

====> Epoch: 13 Average loss: 0.0499
Training ...



6it [00:00, 27.16it/s]



310it [00:05, 56.63it/s]



606it [00:11, 35.77it/s]



909it [00:18, 55.34it/s]



1210it [00:24, 58.82it/s]



1296it [00:25, 50.62it/s]


====> Epoch: 14 Average loss: 0.0489
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 46.18it/s]

Iteration: 12, len(dl): 20731, len(du): 41000, len(dh) 0, acc: 86.87 
Iteration: 13: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2563it [00:52, 48.63it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 21731, len(du) 41000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 21731, len(du) 41000
Iteration: 13 fine-tune the model on dh U dl
Training ...



10it [00:00, 42.92it/s]



304it [00:06, 43.84it/s]



607it [00:13, 52.40it/s]



907it [00:18, 59.49it/s]



1206it [00:25, 33.51it/s]



1359it [00:29, 46.59it/s]

====> Epoch: 0 Average loss: 0.0482
Training ...



8it [00:00, 39.61it/s]



307it [00:05, 54.77it/s]



608it [00:12, 36.77it/s]



911it [00:18, 61.29it/s]



1210it [00:23, 52.74it/s]



1359it [00:27, 49.79it/s]

====> Epoch: 1 Average loss: 0.0493
Training ...



7it [00:00, 21.91it/s]



307it [00:07, 54.77it/s]



608it [00:12, 60.35it/s]



905it [00:19, 37.60it/s]



1211it [00:25, 54.28it/s]



1359it [00:28, 48.29it/s]

====> Epoch: 2 Average loss: 0.0488
Training ...



8it [00:00, 38.17it/s]



304it [00:06, 36.79it/s]



613it [00:13, 58.08it/s]



911it [00:18, 55.07it/s]



1210it [00:26, 42.11it/s]



1359it [00:29, 46.82it/s]

====> Epoch: 3 Average loss: 0.0496
Training ...



8it [00:00, 39.69it/s]



310it [00:05, 60.25it/s]



609it [00:12, 39.56it/s]



908it [00:18, 60.10it/s]



1211it [00:23, 54.68it/s]



1359it [00:27, 49.77it/s]

====> Epoch: 4 Average loss: 0.0498
Training ...



6it [00:00, 24.92it/s]



310it [00:06, 56.18it/s]



611it [00:12, 53.41it/s]



908it [00:19, 33.82it/s]



1212it [00:25, 58.09it/s]



1359it [00:28, 48.12it/s]

====> Epoch: 5 Average loss: 0.0489
Training ...



8it [00:00, 37.86it/s]



306it [00:06, 38.68it/s]



609it [00:13, 61.25it/s]



912it [00:18, 56.91it/s]



1208it [00:25, 35.51it/s]



1359it [00:29, 46.83it/s]

====> Epoch: 6 Average loss: 0.0486
Training ...



8it [00:00, 38.38it/s]



307it [00:05, 57.21it/s]



609it [00:12, 39.56it/s]



907it [00:18, 53.66it/s]



1207it [00:24, 57.00it/s]



1359it [00:27, 49.56it/s]

====> Epoch: 7 Average loss: 0.0489
Training ...



5it [00:00, 18.66it/s]



311it [00:07, 56.31it/s]



613it [00:12, 56.36it/s]



905it [00:19, 32.68it/s]



1211it [00:25, 57.35it/s]



1359it [00:28, 48.08it/s]

====> Epoch: 8 Average loss: 0.0483
Training ...



9it [00:00, 40.82it/s]



308it [00:06, 33.75it/s]



607it [00:13, 53.75it/s]



911it [00:19, 56.45it/s]



1205it [00:26, 34.47it/s]



1359it [00:30, 44.91it/s]

====> Epoch: 9 Average loss: 0.0489
Training ...



10it [00:00, 45.57it/s]



309it [00:05, 57.13it/s]



604it [00:12, 37.19it/s]



910it [00:18, 59.89it/s]



1212it [00:24, 57.16it/s]



1359it [00:27, 48.85it/s]

====> Epoch: 10 Average loss: 0.0490
Training ...



3it [00:00, 13.07it/s]



307it [00:06, 56.19it/s]



610it [00:12, 56.89it/s]



904it [00:19, 29.70it/s]



1210it [00:25, 52.14it/s]



1359it [00:28, 47.75it/s]

====> Epoch: 11 Average loss: 0.0495
Training ...



7it [00:00, 35.27it/s]



302it [00:07, 39.63it/s]



610it [00:13, 54.29it/s]



907it [00:18, 56.63it/s]



1206it [00:26, 34.59it/s]



1359it [00:29, 46.11it/s]

====> Epoch: 12 Average loss: 0.0484
Training ...



7it [00:00, 34.67it/s]



310it [00:05, 53.37it/s]



606it [00:12, 33.88it/s]



907it [00:18, 59.46it/s]



1209it [00:24, 55.88it/s]



1359it [00:28, 47.67it/s]

====> Epoch: 13 Average loss: 0.0489
Training ...



4it [00:00, 19.90it/s]



307it [00:06, 56.62it/s]



607it [00:12, 51.26it/s]



906it [00:19, 39.75it/s]



1207it [00:25, 55.36it/s]



1359it [00:28, 48.24it/s]


====> Epoch: 14 Average loss: 0.0486
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 45.05it/s]

Iteration: 13, len(dl): 21731, len(du): 40000, len(dh) 0, acc: 88.35 
Iteration: 14: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2500it [00:53, 46.87it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 22731, len(du) 40000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 22731, len(du) 40000
Iteration: 14 fine-tune the model on dh U dl
Training ...



5it [00:00, 25.15it/s]



304it [00:06, 34.86it/s]



608it [00:13, 60.73it/s]



908it [00:18, 61.49it/s]



1206it [00:25, 42.77it/s]



1421it [00:30, 46.97it/s]

====> Epoch: 0 Average loss: 0.0480
Training ...



8it [00:00, 37.84it/s]



313it [00:05, 57.03it/s]



605it [00:12, 34.73it/s]



908it [00:19, 56.10it/s]



1208it [00:24, 55.64it/s]



1421it [00:29, 47.91it/s]

====> Epoch: 1 Average loss: 0.0471
Training ...



4it [00:00, 17.48it/s]



308it [00:06, 58.27it/s]



607it [00:11, 50.16it/s]



909it [00:19, 41.70it/s]



1205it [00:25, 62.09it/s]



1421it [00:29, 47.90it/s]

====> Epoch: 2 Average loss: 0.0484
Training ...



5it [00:00, 23.57it/s]



307it [00:08, 51.44it/s]



608it [00:13, 53.74it/s]



907it [00:20, 33.72it/s]



1210it [00:27, 54.53it/s]



1421it [00:31, 44.81it/s]

====> Epoch: 3 Average loss: 0.0483
Training ...



7it [00:00, 34.10it/s]



306it [00:06, 36.05it/s]



613it [00:14, 59.05it/s]



905it [00:19, 51.36it/s]



1204it [00:26, 34.42it/s]



1421it [00:31, 45.14it/s]

====> Epoch: 4 Average loss: 0.0479
Training ...



8it [00:00, 38.57it/s]



306it [00:05, 57.16it/s]



604it [00:12, 36.60it/s]



910it [00:19, 57.44it/s]



1211it [00:24, 57.67it/s]



1421it [00:30, 46.21it/s]

====> Epoch: 5 Average loss: 0.0473
Training ...



4it [00:00, 18.71it/s]



308it [00:06, 52.43it/s]



607it [00:12, 38.59it/s]



908it [00:20, 56.70it/s]



1207it [00:25, 52.11it/s]



1421it [00:30, 47.24it/s]

====> Epoch: 6 Average loss: 0.0477
Training ...



3it [00:00, 14.11it/s]



312it [00:07, 54.16it/s]



610it [00:13, 56.05it/s]



906it [00:20, 35.80it/s]



1210it [00:26, 57.29it/s]



1421it [00:30, 46.83it/s]

====> Epoch: 7 Average loss: 0.0483
Training ...



8it [00:00, 36.10it/s]



305it [00:07, 33.36it/s]



606it [00:13, 52.77it/s]



909it [00:19, 57.59it/s]



1210it [00:27, 41.21it/s]



1421it [00:31, 45.80it/s]

====> Epoch: 8 Average loss: 0.0476
Training ...



8it [00:00, 35.98it/s]



308it [00:05, 54.59it/s]



608it [00:13, 39.12it/s]



909it [00:19, 50.87it/s]



1209it [00:25, 38.02it/s]



1421it [00:31, 45.69it/s]

====> Epoch: 9 Average loss: 0.0480
Training ...



8it [00:00, 41.59it/s]



311it [00:05, 57.92it/s]



605it [00:11, 37.03it/s]



907it [00:19, 52.07it/s]



1208it [00:24, 56.62it/s]



1421it [00:28, 49.40it/s]

====> Epoch: 10 Average loss: 0.0473
Training ...



5it [00:00, 18.36it/s]



311it [00:07, 52.00it/s]



610it [00:12, 53.78it/s]



907it [00:20, 35.75it/s]



1211it [00:26, 56.46it/s]



1421it [00:30, 46.95it/s]

====> Epoch: 11 Average loss: 0.0474
Training ...



5it [00:00, 26.29it/s]



307it [00:07, 33.47it/s]



608it [00:13, 55.67it/s]



911it [00:19, 57.10it/s]



1207it [00:27, 44.58it/s]



1421it [00:30, 45.85it/s]

====> Epoch: 12 Average loss: 0.0476
Training ...



7it [00:00, 35.88it/s]



308it [00:05, 57.66it/s]



613it [00:13, 54.39it/s]



905it [00:18, 49.31it/s]



1206it [00:24, 36.14it/s]



1421it [00:30, 46.31it/s]

====> Epoch: 13 Average loss: 0.0476
Training ...



7it [00:00, 32.96it/s]



306it [00:05, 54.10it/s]



606it [00:12, 34.28it/s]



906it [00:19, 54.36it/s]



1206it [00:25, 52.08it/s]



1421it [00:29, 47.81it/s]


====> Epoch: 14 Average loss: 0.0482
remove 1000 uncertain samples from du
Evaluation ...


625it [00:12, 49.16it/s]

Iteration: 14, len(dl): 22731, len(du): 39000, len(dh) 0, acc: 90.56 
Iteration: 15: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2438it [00:52, 46.00it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 23731, len(du) 39000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 23731, len(du) 39000
Iteration: 15 fine-tune the model on dh U dl
Training ...


8it [00:00, 37.77it/s]



310it [00:08, 46.98it/s]



611it [00:14, 59.08it/s]



905it [00:20, 33.86it/s]



1206it [00:27, 51.12it/s]



1484it [00:32, 45.27it/s]

====> Epoch: 0 Average loss: 0.0476
Training ...



8it [00:00, 34.98it/s]



303it [00:07, 36.23it/s]



609it [00:14, 51.15it/s]



909it [00:19, 55.77it/s]



1208it [00:27, 36.71it/s]



1484it [00:32, 45.61it/s]

====> Epoch: 1 Average loss: 0.0469
Training ...



8it [00:00, 35.39it/s]



307it [00:06, 40.02it/s]



605it [00:13, 50.90it/s]



912it [00:19, 54.30it/s]



1206it [00:25, 35.23it/s]



1484it [00:32, 45.72it/s]

====> Epoch: 2 Average loss: 0.0479
Training ...



8it [00:00, 43.55it/s]



309it [00:05, 53.12it/s]



606it [00:13, 38.27it/s]



913it [00:19, 57.42it/s]



1212it [00:24, 57.47it/s]



1484it [00:31, 46.65it/s]

====> Epoch: 3 Average loss: 0.0466
Training ...



6it [00:00, 30.22it/s]



309it [00:05, 59.13it/s]



607it [00:11, 34.46it/s]



908it [00:19, 56.72it/s]



1209it [00:24, 57.99it/s]



1484it [00:30, 49.06it/s]

====> Epoch: 4 Average loss: 0.0465
Training ...



5it [00:00, 24.29it/s]



312it [00:07, 59.40it/s]



607it [00:12, 57.63it/s]



907it [00:19, 35.94it/s]



1212it [00:25, 55.29it/s]



1484it [00:30, 48.41it/s]

====> Epoch: 5 Average loss: 0.0471
Training ...



6it [00:00, 30.46it/s]



311it [00:08, 52.31it/s]



607it [00:13, 53.79it/s]



907it [00:19, 37.02it/s]



1207it [00:27, 53.00it/s]



1484it [00:32, 45.76it/s]

====> Epoch: 6 Average loss: 0.0476
Training ...



5it [00:00, 19.94it/s]



307it [00:06, 37.46it/s]



610it [00:13, 55.47it/s]



912it [00:18, 61.48it/s]



1208it [00:26, 36.91it/s]



1484it [00:32, 46.34it/s]

====> Epoch: 7 Average loss: 0.0467
Training ...



8it [00:00, 35.23it/s]



304it [00:05, 51.03it/s]



608it [00:13, 55.65it/s]



912it [00:19, 53.46it/s]



1207it [00:25, 35.72it/s]



1484it [00:32, 45.70it/s]

====> Epoch: 8 Average loss: 0.0465
Training ...



7it [00:00, 34.27it/s]



311it [00:05, 56.14it/s]



606it [00:12, 42.07it/s]



908it [00:19, 56.61it/s]



1212it [00:24, 53.78it/s]



1484it [00:31, 46.79it/s]

====> Epoch: 9 Average loss: 0.0478
Training ...



5it [00:00, 18.91it/s]



309it [00:06, 54.21it/s]



606it [00:11, 45.01it/s]



909it [00:19, 54.21it/s]



1209it [00:25, 52.61it/s]



1484it [00:30, 48.02it/s]

====> Epoch: 10 Average loss: 0.0474
Training ...



4it [00:00, 17.83it/s]



308it [00:07, 56.04it/s]



608it [00:12, 58.02it/s]



905it [00:19, 33.05it/s]



1210it [00:25, 57.17it/s]



1484it [00:30, 48.04it/s]

====> Epoch: 11 Average loss: 0.0481
Training ...



7it [00:00, 32.27it/s]



311it [00:08, 52.39it/s]



606it [00:13, 51.14it/s]



907it [00:20, 30.75it/s]



1210it [00:27, 54.58it/s]



1484it [00:32, 45.46it/s]

====> Epoch: 12 Average loss: 0.0477
Training ...



6it [00:00, 29.53it/s]



305it [00:07, 36.77it/s]



611it [00:13, 56.93it/s]



911it [00:19, 57.40it/s]



1206it [00:26, 35.30it/s]



1484it [00:32, 45.78it/s]

====> Epoch: 13 Average loss: 0.0475
Training ...



7it [00:00, 32.49it/s]



307it [00:05, 50.40it/s]



611it [00:13, 52.14it/s]



911it [00:19, 53.48it/s]



1207it [00:25, 36.04it/s]



1484it [00:32, 45.83it/s]


====> Epoch: 14 Average loss: 0.0475
remove 1000 uncertain samples from du
Evaluation ...


625it [00:12, 48.24it/s]

Iteration: 15, len(dl): 23731, len(du): 38000, len(dh) 0, acc: 86.72 
Iteration: 16: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2375it [00:50, 47.29it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 24731, len(du) 38000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 24731, len(du) 38000
Iteration: 16 fine-tune the model on dh U dl
Training ...



5it [00:00, 19.45it/s]



309it [00:06, 55.35it/s]



609it [00:12, 54.07it/s]



905it [00:20, 36.51it/s]



1212it [00:25, 57.12it/s]



1507it [00:31, 45.17it/s]



1546it [00:32, 47.78it/s]

====> Epoch: 0 Average loss: 0.0464
Training ...



5it [00:00, 19.14it/s]



311it [00:07, 54.92it/s]



611it [00:13, 53.40it/s]



906it [00:20, 37.54it/s]



1207it [00:26, 53.32it/s]



1511it [00:32, 59.02it/s]



1546it [00:32, 47.08it/s]

====> Epoch: 1 Average loss: 0.0462
Training ...



5it [00:00, 16.89it/s]



308it [00:08, 50.78it/s]



607it [00:13, 58.20it/s]



906it [00:20, 36.26it/s]



1212it [00:27, 55.22it/s]



1512it [00:32, 57.55it/s]



1546it [00:33, 46.73it/s]

====> Epoch: 2 Average loss: 0.0467
Training ...



6it [00:00, 24.73it/s]



307it [00:08, 40.95it/s]



613it [00:14, 57.26it/s]



905it [00:20, 31.14it/s]



1207it [00:27, 50.29it/s]



1506it [00:32, 56.28it/s]



1546it [00:33, 46.07it/s]


====> Epoch: 3 Average loss: 0.0460
Training ...


7it [00:00, 34.47it/s]



306it [00:07, 34.59it/s]



611it [00:13, 58.28it/s]



907it [00:19, 57.29it/s]



1205it [00:27, 35.79it/s]



1507it [00:32, 53.80it/s]



1546it [00:33, 45.87it/s]

====> Epoch: 4 Average loss: 0.0475
Training ...



5it [00:00, 24.45it/s]



307it [00:06, 36.05it/s]



608it [00:13, 58.88it/s]



912it [00:19, 54.99it/s]



1206it [00:26, 37.52it/s]



1511it [00:32, 54.35it/s]



1546it [00:33, 46.08it/s]

====> Epoch: 5 Average loss: 0.0462
Training ...



9it [00:00, 44.89it/s]



307it [00:05, 39.97it/s]



613it [00:13, 55.11it/s]



908it [00:19, 51.66it/s]



1208it [00:25, 34.69it/s]



1508it [00:32, 55.44it/s]



1546it [00:33, 45.88it/s]

====> Epoch: 6 Average loss: 0.0460
Training ...



9it [00:00, 43.55it/s]



309it [00:05, 53.30it/s]



605it [00:13, 34.38it/s]



911it [00:19, 56.32it/s]



1207it [00:24, 52.30it/s]



1513it [00:33, 49.28it/s]



1546it [00:34, 45.39it/s]

====> Epoch: 7 Average loss: 0.0467
Training ...



7it [00:00, 31.41it/s]



310it [00:05, 56.37it/s]



608it [00:12, 37.90it/s]



908it [00:19, 57.39it/s]



1207it [00:24, 54.76it/s]



1506it [00:32, 36.94it/s]



1546it [00:33, 46.05it/s]

====> Epoch: 8 Average loss: 0.0466
Training ...



4it [00:00, 17.07it/s]



312it [00:05, 53.33it/s]



605it [00:11, 39.58it/s]



905it [00:19, 47.19it/s]



1209it [00:24, 56.11it/s]



1509it [00:31, 37.12it/s]



1546it [00:32, 47.88it/s]

====> Epoch: 9 Average loss: 0.0472
Training ...



4it [00:00, 18.22it/s]



309it [00:06, 54.69it/s]



605it [00:12, 52.49it/s]



910it [00:20, 49.44it/s]



1210it [00:25, 56.85it/s]



1508it [00:31, 39.59it/s]



1546it [00:32, 47.09it/s]

====> Epoch: 10 Average loss: 0.0457
Training ...



5it [00:00, 19.77it/s]



310it [00:06, 55.30it/s]



607it [00:12, 51.62it/s]



907it [00:20, 38.54it/s]



1210it [00:26, 51.45it/s]



1508it [00:31, 38.73it/s]



1546it [00:32, 46.93it/s]

====> Epoch: 11 Average loss: 0.0464
Training ...



5it [00:00, 16.60it/s]



313it [00:07, 54.52it/s]



607it [00:12, 57.89it/s]



905it [00:20, 33.37it/s]



1208it [00:26, 53.08it/s]



1510it [00:31, 53.70it/s]



1546it [00:33, 46.80it/s]

====> Epoch: 12 Average loss: 0.0462
Training ...



3it [00:00, 12.27it/s]



311it [00:07, 55.20it/s]



611it [00:13, 50.11it/s]



907it [00:20, 38.50it/s]



1207it [00:27, 53.80it/s]



1512it [00:32, 64.02it/s]



1546it [00:33, 45.85it/s]

====> Epoch: 13 Average loss: 0.0459
Training ...



5it [00:00, 20.44it/s]



310it [00:07, 56.40it/s]



610it [00:13, 55.65it/s]



905it [00:20, 40.97it/s]



1208it [00:26, 48.33it/s]



1508it [00:32, 55.49it/s]



1546it [00:33, 46.82it/s]


====> Epoch: 14 Average loss: 0.0472
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 45.48it/s]

Iteration: 16, len(dl): 24731, len(du): 37000, len(dh) 0, acc: 88.86 
Iteration: 17: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2313it [00:50, 45.39it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 25731, len(du) 37000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 25731, len(du) 37000
Iteration: 17 fine-tune the model on dh U dl
Training ...



6it [00:00, 28.73it/s]



307it [00:06, 35.18it/s]



612it [00:14, 56.02it/s]



906it [00:19, 57.68it/s]



1204it [00:27, 33.41it/s]



1507it [00:33, 53.80it/s]



1609it [00:35, 45.06it/s]

====> Epoch: 0 Average loss: 0.0448
Training ...



7it [00:00, 33.12it/s]



308it [00:07, 35.83it/s]



610it [00:14, 54.20it/s]



910it [00:19, 55.49it/s]



1205it [00:27, 38.45it/s]



1508it [00:33, 57.92it/s]



1609it [00:35, 45.49it/s]

====> Epoch: 1 Average loss: 0.0464
Training ...



6it [00:00, 30.67it/s]



306it [00:07, 40.13it/s]



608it [00:14, 52.22it/s]



908it [00:19, 52.79it/s]



1205it [00:26, 34.81it/s]



1506it [00:33, 51.33it/s]



1609it [00:35, 45.95it/s]

====> Epoch: 2 Average loss: 0.0452
Training ...



7it [00:00, 36.31it/s]



307it [00:07, 36.74it/s]



609it [00:14, 52.82it/s]



907it [00:19, 58.19it/s]



1206it [00:26, 37.10it/s]



1511it [00:33, 57.58it/s]



1609it [00:35, 45.93it/s]

====> Epoch: 3 Average loss: 0.0459
Training ...



7it [00:00, 32.00it/s]



306it [00:06, 36.40it/s]



607it [00:13, 52.79it/s]



909it [00:19, 55.21it/s]



1206it [00:26, 37.36it/s]



1509it [00:33, 55.13it/s]



1609it [00:34, 45.98it/s]

====> Epoch: 4 Average loss: 0.0463
Training ...



7it [00:00, 35.75it/s]



306it [00:06, 36.44it/s]



612it [00:13, 56.25it/s]



913it [00:19, 54.75it/s]



1206it [00:26, 35.02it/s]



1508it [00:33, 58.33it/s]



1609it [00:35, 45.74it/s]

====> Epoch: 5 Average loss: 0.0459
Training ...



7it [00:00, 34.24it/s]



305it [00:06, 36.60it/s]



609it [00:13, 52.69it/s]



906it [00:19, 57.37it/s]



1205it [00:25, 33.78it/s]



1509it [00:32, 52.68it/s]



1609it [00:34, 46.24it/s]

====> Epoch: 6 Average loss: 0.0466
Training ...



6it [00:00, 29.01it/s]



305it [00:05, 39.91it/s]



611it [00:14, 55.15it/s]



907it [00:19, 55.10it/s]



1205it [00:25, 35.61it/s]



1508it [00:33, 58.47it/s]



1609it [00:35, 45.90it/s]

====> Epoch: 7 Average loss: 0.0462
Training ...



8it [00:00, 36.88it/s]



308it [00:05, 49.85it/s]



604it [00:13, 34.77it/s]



909it [00:19, 56.04it/s]



1207it [00:25, 36.17it/s]



1507it [00:33, 54.80it/s]



1609it [00:35, 45.78it/s]

====> Epoch: 8 Average loss: 0.0460
Training ...



6it [00:00, 29.31it/s]



310it [00:05, 52.76it/s]



606it [00:13, 36.20it/s]



909it [00:19, 52.96it/s]



1204it [00:25, 33.41it/s]



1512it [00:33, 57.41it/s]



1609it [00:35, 45.20it/s]

====> Epoch: 9 Average loss: 0.0459
Training ...



8it [00:00, 38.99it/s]



309it [00:05, 54.03it/s]



607it [00:14, 35.28it/s]



907it [00:19, 55.13it/s]



1207it [00:25, 35.51it/s]



1510it [00:34, 53.67it/s]



1609it [00:36, 44.62it/s]

====> Epoch: 10 Average loss: 0.0453
Training ...



7it [00:00, 36.15it/s]



307it [00:05, 53.21it/s]



603it [00:13, 40.16it/s]



910it [00:19, 52.22it/s]



1207it [00:25, 33.37it/s]



1511it [00:33, 59.42it/s]



1609it [00:35, 45.19it/s]

====> Epoch: 11 Average loss: 0.0460
Training ...



8it [00:00, 42.88it/s]



309it [00:05, 52.85it/s]



609it [00:13, 43.87it/s]



910it [00:19, 56.08it/s]



1209it [00:25, 36.97it/s]



1509it [00:33, 55.25it/s]



1609it [00:34, 46.16it/s]

====> Epoch: 12 Average loss: 0.0456
Training ...



8it [00:00, 38.40it/s]



312it [00:05, 55.89it/s]



608it [00:13, 34.84it/s]



908it [00:19, 57.03it/s]



1205it [00:25, 35.94it/s]



1509it [00:33, 59.01it/s]



1609it [00:35, 45.52it/s]

====> Epoch: 13 Average loss: 0.0457
Training ...



8it [00:00, 40.70it/s]



306it [00:05, 63.12it/s]



607it [00:13, 36.55it/s]



907it [00:19, 54.49it/s]



1205it [00:24, 62.05it/s]



1509it [00:33, 47.40it/s]



1609it [00:35, 45.81it/s]


====> Epoch: 14 Average loss: 0.0461
remove 1000 uncertain samples from du
Evaluation ...


625it [00:14, 43.80it/s]

Iteration: 17, len(dl): 25731, len(du): 36000, len(dh) 0, acc: 86.31 
Iteration: 18: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2250it [00:48, 46.54it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 26731, len(du) 36000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 26731, len(du) 36000
Iteration: 18 fine-tune the model on dh U dl
Training ...



5it [00:00, 17.56it/s]



311it [00:07, 53.88it/s]



607it [00:12, 59.89it/s]



909it [00:20, 37.68it/s]



1208it [00:26, 55.87it/s]



1507it [00:31, 36.41it/s]



1671it [00:36, 45.65it/s]

====> Epoch: 0 Average loss: 0.0456
Training ...



5it [00:00, 21.39it/s]



312it [00:06, 56.78it/s]



607it [00:12, 42.01it/s]



908it [00:20, 51.55it/s]



1209it [00:25, 53.94it/s]



1507it [00:32, 38.26it/s]



1671it [00:37, 44.83it/s]

====> Epoch: 1 Average loss: 0.0450
Training ...



7it [00:00, 33.04it/s]



309it [00:05, 54.49it/s]



604it [00:12, 31.06it/s]



908it [00:19, 56.91it/s]



1209it [00:25, 53.69it/s]



1507it [00:32, 35.99it/s]



1671it [00:36, 45.34it/s]

====> Epoch: 2 Average loss: 0.0454
Training ...



8it [00:00, 38.10it/s]



306it [00:05, 51.53it/s]



604it [00:13, 34.08it/s]



908it [00:20, 55.32it/s]



1210it [00:25, 53.88it/s]



1507it [00:33, 38.55it/s]



1671it [00:37, 45.14it/s]

====> Epoch: 3 Average loss: 0.0446
Training ...



7it [00:00, 34.96it/s]



311it [00:05, 52.90it/s]



607it [00:14, 35.04it/s]



910it [00:19, 49.73it/s]



1208it [00:26, 34.55it/s]



1508it [00:34, 52.97it/s]



1671it [00:37, 44.72it/s]

====> Epoch: 4 Average loss: 0.0461
Training ...



6it [00:00, 29.66it/s]



306it [00:06, 33.88it/s]



604it [00:14, 45.41it/s]



911it [00:20, 52.73it/s]



1206it [00:27, 34.62it/s]



1510it [00:34, 56.83it/s]



1671it [00:37, 44.33it/s]

====> Epoch: 5 Average loss: 0.0456
Training ...



7it [00:00, 34.32it/s]



304it [00:06, 32.11it/s]



608it [00:14, 55.31it/s]



913it [00:20, 51.57it/s]



1206it [00:27, 33.84it/s]



1504it [00:34, 48.87it/s]



1671it [00:37, 44.89it/s]

====> Epoch: 6 Average loss: 0.0453
Training ...



8it [00:00, 38.85it/s]



308it [00:07, 37.87it/s]



611it [00:14, 53.67it/s]



909it [00:20, 55.45it/s]



1204it [00:28, 38.16it/s]



1508it [00:34, 54.21it/s]



1671it [00:37, 44.96it/s]

====> Epoch: 7 Average loss: 0.0454
Training ...



7it [00:00, 35.17it/s]



307it [00:08, 32.94it/s]



608it [00:14, 54.28it/s]



906it [00:20, 47.39it/s]



1207it [00:28, 49.11it/s]



1511it [00:34, 56.63it/s]



1671it [00:37, 44.78it/s]

====> Epoch: 8 Average loss: 0.0456
Training ...



7it [00:00, 37.76it/s]



307it [00:08, 46.35it/s]



609it [00:14, 56.61it/s]



906it [00:20, 34.27it/s]



1206it [00:28, 52.24it/s]



1509it [00:34, 51.62it/s]



1671it [00:37, 44.52it/s]

====> Epoch: 9 Average loss: 0.0457
Training ...



4it [00:00, 16.21it/s]



309it [00:08, 52.70it/s]



606it [00:13, 59.42it/s]



902it [00:21, 43.05it/s]



1210it [00:28, 53.89it/s]



1508it [00:33, 54.91it/s]



1671it [00:38, 43.93it/s]

====> Epoch: 10 Average loss: 0.0455
Training ...



3it [00:00, 13.90it/s]



310it [00:07, 50.84it/s]



607it [00:13, 47.21it/s]



911it [00:22, 44.15it/s]



1211it [00:28, 53.39it/s]



1508it [00:35, 33.03it/s]



1671it [00:40, 41.69it/s]

====> Epoch: 11 Average loss: 0.0454
Training ...



8it [00:00, 39.19it/s]



312it [00:06, 50.09it/s]



607it [00:13, 33.73it/s]



910it [00:20, 51.08it/s]



1211it [00:26, 49.72it/s]



1504it [00:34, 33.66it/s]



1671it [00:38, 43.50it/s]

====> Epoch: 12 Average loss: 0.0453
Training ...



7it [00:00, 33.00it/s]



306it [00:05, 55.80it/s]



606it [00:13, 32.04it/s]



909it [00:20, 52.13it/s]



1205it [00:26, 39.07it/s]



1509it [00:34, 52.66it/s]



1671it [00:38, 43.89it/s]

====> Epoch: 13 Average loss: 0.0452
Training ...



6it [00:00, 30.72it/s]



308it [00:06, 43.18it/s]



608it [00:14, 48.04it/s]



906it [00:20, 52.39it/s]



1206it [00:27, 32.75it/s]



1509it [00:35, 50.19it/s]



1671it [00:38, 43.68it/s]


====> Epoch: 14 Average loss: 0.0458
remove 1000 uncertain samples from du
Evaluation ...


625it [00:15, 41.62it/s]

Iteration: 18, len(dl): 26731, len(du): 35000, len(dh) 0, acc: 90.72 
Iteration: 19: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2188it [00:49, 44.01it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 27731, len(du) 35000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 27731, len(du) 35000
Iteration: 19 fine-tune the model on dh U dl
Training ...



5it [00:00, 21.66it/s]



311it [00:07, 50.06it/s]



606it [00:13, 35.75it/s]



910it [00:21, 51.59it/s]



1211it [00:27, 52.70it/s]



1507it [00:34, 35.87it/s]



1734it [00:40, 43.07it/s]

====> Epoch: 0 Average loss: 0.0446
Training ...



7it [00:00, 30.26it/s]



312it [00:06, 53.50it/s]



608it [00:13, 36.11it/s]



909it [00:20, 52.72it/s]



1210it [00:26, 51.82it/s]



1505it [00:34, 35.03it/s]



1734it [00:39, 44.14it/s]

====> Epoch: 1 Average loss: 0.0445
Training ...



7it [00:00, 33.38it/s]



306it [00:06, 41.04it/s]



605it [00:14, 51.25it/s]



907it [00:20, 52.21it/s]



1205it [00:27, 33.68it/s]



1511it [00:35, 54.46it/s]



1734it [00:39, 44.07it/s]

====> Epoch: 2 Average loss: 0.0447
Training ...



7it [00:00, 34.87it/s]



306it [00:07, 33.56it/s]



612it [00:14, 51.19it/s]



908it [00:20, 52.91it/s]



1208it [00:28, 34.98it/s]



1508it [00:34, 53.64it/s]



1734it [00:39, 44.28it/s]

====> Epoch: 3 Average loss: 0.0447
Training ...



7it [00:00, 33.93it/s]



309it [00:09, 43.48it/s]



612it [00:14, 54.30it/s]



907it [00:21, 34.74it/s]



1211it [00:29, 48.04it/s]



1508it [00:34, 53.62it/s]



1734it [00:39, 43.59it/s]

====> Epoch: 4 Average loss: 0.0442
Training ...



4it [00:00, 19.23it/s]



309it [00:07, 56.00it/s]



607it [00:12, 57.18it/s]



905it [00:20, 35.95it/s]



1212it [00:26, 56.07it/s]



1509it [00:32, 39.99it/s]



1734it [00:38, 44.54it/s]

====> Epoch: 5 Average loss: 0.0445
Training ...



5it [00:00, 21.90it/s]



310it [00:06, 53.26it/s]



607it [00:12, 34.60it/s]



909it [00:20, 52.59it/s]



1211it [00:25, 54.25it/s]



1504it [00:32, 40.69it/s]



1734it [00:38, 44.88it/s]

====> Epoch: 6 Average loss: 0.0450
Training ...



7it [00:00, 32.48it/s]



307it [00:05, 51.22it/s]



607it [00:13, 36.25it/s]



911it [00:20, 53.39it/s]



1207it [00:25, 54.45it/s]



1506it [00:33, 35.85it/s]



1734it [00:38, 44.82it/s]

====> Epoch: 7 Average loss: 0.0449
Training ...



7it [00:00, 32.61it/s]



307it [00:05, 53.96it/s]



607it [00:14, 39.83it/s]



909it [00:19, 52.29it/s]



1203it [00:26, 32.32it/s]



1509it [00:34, 54.82it/s]



1734it [00:38, 44.97it/s]

====> Epoch: 8 Average loss: 0.0446
Training ...



7it [00:00, 37.77it/s]



304it [00:06, 35.88it/s]



608it [00:14, 53.48it/s]



906it [00:20, 52.73it/s]



1207it [00:28, 30.86it/s]



1507it [00:34, 50.28it/s]



1734it [00:38, 44.72it/s]

====> Epoch: 9 Average loss: 0.0445
Training ...



7it [00:00, 31.06it/s]



306it [00:08, 34.21it/s]



608it [00:14, 54.00it/s]



908it [00:20, 35.52it/s]



1206it [00:28, 41.50it/s]



1510it [00:34, 52.10it/s]



1734it [00:39, 43.90it/s]

====> Epoch: 10 Average loss: 0.0444
Training ...



5it [00:00, 20.22it/s]



311it [00:07, 54.02it/s]



607it [00:13, 52.96it/s]



905it [00:21, 33.07it/s]



1208it [00:27, 53.90it/s]



1506it [00:34, 33.28it/s]



1734it [00:40, 42.72it/s]

====> Epoch: 11 Average loss: 0.0447
Training ...



5it [00:00, 26.97it/s]



310it [00:06, 52.82it/s]



604it [00:12, 35.20it/s]



907it [00:20, 59.41it/s]



1208it [00:25, 53.71it/s]



1505it [00:33, 34.99it/s]



1734it [00:39, 44.40it/s]

====> Epoch: 12 Average loss: 0.0452
Training ...



6it [00:00, 31.48it/s]



311it [00:06, 52.57it/s]



607it [00:14, 32.55it/s]



907it [00:20, 53.23it/s]



1210it [00:26, 48.76it/s]



1510it [00:34, 46.12it/s]



1734it [00:39, 44.40it/s]

====> Epoch: 13 Average loss: 0.0448
Training ...



7it [00:00, 32.14it/s]



308it [00:06, 35.81it/s]



609it [00:14, 54.43it/s]



907it [00:20, 53.60it/s]



1206it [00:27, 31.55it/s]



1508it [00:34, 50.43it/s]



1734it [00:39, 44.28it/s]


====> Epoch: 14 Average loss: 0.0451
remove 1000 uncertain samples from du
Evaluation ...


625it [00:14, 42.38it/s]

Iteration: 19, len(dl): 27731, len(du): 34000, len(dh) 0, acc: 91.14 
Iteration: 20: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2125it [00:49, 42.87it/s]


Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 28731, len(du) 34000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 28731, len(du) 34000
Iteration: 20 fine-tune the model on dh U dl
Training ...


9it [00:00, 39.14it/s]



308it [00:06, 52.99it/s]



606it [00:13, 36.00it/s]



913it [00:20, 56.78it/s]



1212it [00:26, 56.37it/s]



1508it [00:34, 38.80it/s]



1796it [00:40, 44.36it/s]

====> Epoch: 0 Average loss: 0.0437
Training ...



7it [00:00, 35.22it/s]



309it [00:06, 38.56it/s]



609it [00:14, 51.60it/s]



911it [00:20, 54.07it/s]



1204it [00:27, 36.19it/s]



1506it [00:34, 50.57it/s]



1796it [00:39, 44.94it/s]

====> Epoch: 1 Average loss: 0.0435
Training ...



9it [00:00, 40.67it/s]



307it [00:08, 33.43it/s]



607it [00:14, 53.60it/s]



907it [00:21, 31.74it/s]



1211it [00:29, 51.55it/s]



1508it [00:34, 51.53it/s]



1796it [00:42, 42.66it/s]

====> Epoch: 2 Average loss: 0.0450
Training ...



5it [00:00, 19.61it/s]



311it [00:06, 55.73it/s]



606it [00:12, 43.97it/s]



910it [00:20, 51.97it/s]



1210it [00:26, 51.73it/s]



1507it [00:33, 35.08it/s]



1796it [00:40, 44.27it/s]

====> Epoch: 3 Average loss: 0.0431
Training ...



7it [00:00, 36.24it/s]



308it [00:06, 53.53it/s]



605it [00:14, 33.92it/s]



908it [00:20, 52.37it/s]



1205it [00:26, 38.01it/s]



1511it [00:34, 49.49it/s]



1796it [00:40, 44.78it/s]

====> Epoch: 4 Average loss: 0.0436
Training ...



4it [00:00, 19.49it/s]



305it [00:07, 33.41it/s]



613it [00:14, 55.39it/s]



910it [00:20, 52.47it/s]



1206it [00:28, 36.86it/s]



1507it [00:34, 53.71it/s]



1796it [00:40, 43.81it/s]

====> Epoch: 5 Average loss: 0.0441
Training ...



5it [00:00, 21.18it/s]



310it [00:07, 56.27it/s]



610it [00:13, 55.05it/s]



906it [00:20, 37.29it/s]



1208it [00:27, 52.13it/s]



1505it [00:33, 53.20it/s]



1796it [00:41, 43.20it/s]

====> Epoch: 6 Average loss: 0.0435
Training ...



8it [00:00, 40.31it/s]



311it [00:06, 52.12it/s]



606it [00:12, 30.89it/s]



911it [00:20, 50.73it/s]



1212it [00:26, 55.89it/s]



1506it [00:34, 31.00it/s]



1796it [00:40, 44.14it/s]

====> Epoch: 7 Average loss: 0.0433
Training ...



7it [00:00, 31.80it/s]



305it [00:06, 32.03it/s]



609it [00:14, 46.97it/s]



910it [00:20, 50.38it/s]



1206it [00:27, 36.88it/s]



1510it [00:34, 53.46it/s]



1796it [00:40, 44.54it/s]

====> Epoch: 8 Average loss: 0.0435
Training ...



6it [00:00, 29.79it/s]



307it [00:08, 33.87it/s]



606it [00:14, 42.73it/s]



907it [00:20, 35.44it/s]



1209it [00:28, 54.74it/s]



1511it [00:34, 55.41it/s]



1796it [00:41, 42.98it/s]

====> Epoch: 9 Average loss: 0.0448
Training ...



5it [00:00, 18.99it/s]



308it [00:07, 53.47it/s]



612it [00:12, 56.03it/s]



908it [00:21, 51.25it/s]



1212it [00:27, 51.54it/s]



1505it [00:33, 34.93it/s]



1796it [00:41, 43.66it/s]

====> Epoch: 10 Average loss: 0.0440
Training ...



6it [00:00, 31.21it/s]



309it [00:06, 54.20it/s]



605it [00:13, 34.05it/s]



911it [00:20, 52.39it/s]



1208it [00:26, 39.00it/s]



1506it [00:34, 49.89it/s]



1796it [00:40, 44.61it/s]

====> Epoch: 11 Average loss: 0.0439
Training ...



6it [00:00, 29.40it/s]



304it [00:07, 32.97it/s]



610it [00:14, 54.13it/s]



906it [00:20, 48.79it/s]



1207it [00:28, 32.80it/s]



1508it [00:34, 51.28it/s]



1796it [00:40, 44.37it/s]

====> Epoch: 12 Average loss: 0.0440
Training ...



3it [00:00, 12.39it/s]



307it [00:08, 53.72it/s]



612it [00:14, 53.88it/s]



907it [00:21, 32.61it/s]



1208it [00:28, 54.80it/s]



1511it [00:34, 49.16it/s]



1796it [00:42, 42.18it/s]

====> Epoch: 13 Average loss: 0.0438
Training ...



5it [00:00, 22.96it/s]



311it [00:06, 54.36it/s]



605it [00:12, 34.67it/s]



909it [00:20, 50.81it/s]



1208it [00:26, 55.99it/s]



1506it [00:33, 37.99it/s]



1796it [00:40, 44.22it/s]


====> Epoch: 14 Average loss: 0.0439
remove 1000 uncertain samples from du
Evaluation ...


625it [00:15, 41.53it/s]

Iteration: 20, len(dl): 28731, len(du): 33000, len(dh) 0, acc: 86.03 
Iteration: 21: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2063it [00:45, 45.58it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 29731, len(du) 33000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 29731, len(du) 33000
Iteration: 21 fine-tune the model on dh U dl
Training ...



5it [00:00, 24.12it/s]



305it [00:08, 37.97it/s]



610it [00:14, 52.98it/s]



907it [00:21, 32.69it/s]



1210it [00:29, 54.77it/s]



1512it [00:35, 52.64it/s]



1806it [00:42, 31.80it/s]



1859it [00:44, 42.00it/s]

====> Epoch: 0 Average loss: 0.0432
Training ...



5it [00:00, 21.28it/s]



309it [00:06, 55.91it/s]



608it [00:12, 33.87it/s]



911it [00:20, 49.84it/s]



1210it [00:26, 55.36it/s]



1506it [00:33, 31.43it/s]



1811it [00:40, 52.45it/s]



1859it [00:41, 44.76it/s]

====> Epoch: 1 Average loss: 0.0435
Training ...



8it [00:00, 36.35it/s]



306it [00:06, 33.16it/s]



609it [00:14, 53.62it/s]



911it [00:20, 51.56it/s]



1209it [00:27, 35.12it/s]



1507it [00:34, 52.65it/s]



1811it [00:40, 50.89it/s]



1859it [00:41, 44.42it/s]

====> Epoch: 2 Average loss: 0.0432
Training ...



5it [00:00, 19.04it/s]



309it [00:08, 54.00it/s]



608it [00:14, 45.15it/s]



905it [00:21, 34.52it/s]



1207it [00:28, 55.10it/s]



1513it [00:34, 56.22it/s]



1809it [00:42, 37.55it/s]



1859it [00:43, 42.57it/s]

====> Epoch: 3 Average loss: 0.0432
Training ...



6it [00:00, 30.26it/s]



312it [00:06, 54.05it/s]



607it [00:12, 38.91it/s]



913it [00:20, 53.76it/s]



1209it [00:26, 44.84it/s]



1505it [00:34, 31.75it/s]



1810it [00:40, 50.01it/s]



1859it [00:41, 44.35it/s]

====> Epoch: 4 Average loss: 0.0433
Training ...



8it [00:00, 37.59it/s]



307it [00:06, 35.35it/s]



610it [00:14, 51.38it/s]



909it [00:20, 53.29it/s]



1205it [00:28, 33.31it/s]



1508it [00:35, 52.80it/s]



1808it [00:41, 51.45it/s]



1859it [00:42, 43.56it/s]

====> Epoch: 5 Average loss: 0.0442
Training ...



4it [00:00, 17.30it/s]



307it [00:08, 51.19it/s]



611it [00:14, 52.65it/s]



907it [00:21, 31.42it/s]



1207it [00:28, 53.50it/s]



1508it [00:34, 55.30it/s]



1806it [00:42, 34.75it/s]



1859it [00:43, 42.42it/s]

====> Epoch: 6 Average loss: 0.0429
Training ...



7it [00:00, 35.51it/s]



312it [00:06, 53.21it/s]



609it [00:13, 37.59it/s]



906it [00:20, 51.28it/s]



1204it [00:26, 54.05it/s]



1504it [00:34, 32.26it/s]



1811it [00:40, 54.61it/s]



1859it [00:41, 44.59it/s]

====> Epoch: 7 Average loss: 0.0434
Training ...



7it [00:00, 36.68it/s]



306it [00:07, 36.33it/s]



607it [00:14, 53.10it/s]



906it [00:20, 52.50it/s]



1205it [00:28, 33.47it/s]



1507it [00:35, 38.80it/s]



1807it [00:41, 39.91it/s]



1859it [00:42, 43.40it/s]

====> Epoch: 8 Average loss: 0.0434
Training ...



5it [00:00, 18.85it/s]



309it [00:07, 55.19it/s]



608it [00:13, 54.02it/s]



905it [00:21, 33.62it/s]



1207it [00:28, 56.27it/s]



1506it [00:34, 31.63it/s]



1807it [00:42, 36.34it/s]



1859it [00:43, 42.71it/s]

====> Epoch: 9 Average loss: 0.0435
Training ...



7it [00:00, 33.84it/s]



305it [00:06, 41.06it/s]



607it [00:14, 34.35it/s]



908it [00:20, 51.74it/s]



1205it [00:26, 38.88it/s]



1506it [00:35, 46.66it/s]



1811it [00:41, 49.25it/s]



1859it [00:42, 43.95it/s]

====> Epoch: 10 Average loss: 0.0432
Training ...



7it [00:00, 32.93it/s]



305it [00:08, 32.94it/s]



611it [00:14, 53.53it/s]



906it [00:20, 54.45it/s]



1207it [00:29, 35.13it/s]



1512it [00:35, 54.21it/s]



1805it [00:41, 32.49it/s]



1859it [00:43, 42.71it/s]

====> Epoch: 11 Average loss: 0.0434
Training ...



4it [00:00, 20.81it/s]



308it [00:07, 53.01it/s]



607it [00:13, 36.49it/s]



905it [00:21, 32.22it/s]



1207it [00:27, 53.37it/s]



1504it [00:33, 34.70it/s]



1808it [00:41, 54.84it/s]



1859it [00:42, 43.40it/s]

====> Epoch: 12 Average loss: 0.0436
Training ...



7it [00:00, 35.32it/s]



308it [00:06, 50.96it/s]



607it [00:14, 33.93it/s]



909it [00:20, 52.31it/s]



1206it [00:27, 31.31it/s]



1510it [00:35, 54.67it/s]



1814it [00:41, 55.38it/s]



1859it [00:42, 43.80it/s]

====> Epoch: 13 Average loss: 0.0433
Training ...



7it [00:00, 32.20it/s]



306it [00:08, 37.27it/s]



611it [00:15, 49.33it/s]



904it [00:21, 40.11it/s]



1211it [00:29, 48.56it/s]



1507it [00:35, 53.55it/s]



1807it [00:42, 34.71it/s]



1859it [00:44, 42.21it/s]


====> Epoch: 14 Average loss: 0.0432
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 45.39it/s]

Iteration: 21, len(dl): 29731, len(du): 32000, len(dh) 0, acc: 87.04 
Iteration: 22: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



2000it [00:46, 42.95it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 30731, len(du) 32000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 30731, len(du) 32000
Iteration: 22 fine-tune the model on dh U dl
Training ...



6it [00:00, 29.85it/s]



308it [00:07, 36.48it/s]



606it [00:15, 48.90it/s]



906it [00:20, 52.59it/s]



1206it [00:28, 36.33it/s]



1507it [00:35, 54.24it/s]



1809it [00:41, 52.49it/s]



1921it [00:44, 43.22it/s]

====> Epoch: 0 Average loss: 0.0432
Training ...



5it [00:00, 20.09it/s]



308it [00:07, 55.25it/s]



607it [00:13, 53.06it/s]



905it [00:22, 30.90it/s]



1207it [00:28, 51.07it/s]



1504it [00:35, 32.58it/s]



1809it [00:43, 50.81it/s]



1921it [00:46, 41.69it/s]

====> Epoch: 1 Average loss: 0.0431
Training ...



7it [00:00, 34.81it/s]



307it [00:06, 36.41it/s]



607it [00:15, 45.21it/s]



908it [00:20, 53.58it/s]



1205it [00:28, 34.89it/s]



1509it [00:35, 54.10it/s]



1812it [00:41, 58.29it/s]



1921it [00:44, 43.28it/s]

====> Epoch: 2 Average loss: 0.0430
Training ...



3it [00:00, 14.77it/s]



310it [00:08, 53.40it/s]



609it [00:14, 51.79it/s]



907it [00:21, 34.84it/s]



1206it [00:28, 53.45it/s]



1508it [00:34, 51.49it/s]



1809it [00:42, 39.99it/s]



1921it [00:45, 42.34it/s]

====> Epoch: 3 Average loss: 0.0431
Training ...



7it [00:00, 33.59it/s]



307it [00:06, 53.18it/s]



604it [00:14, 31.72it/s]



910it [00:20, 55.16it/s]



1206it [00:26, 45.05it/s]



1508it [00:35, 49.82it/s]



1811it [00:41, 49.94it/s]



1921it [00:43, 43.80it/s]

====> Epoch: 4 Average loss: 0.0431
Training ...



5it [00:00, 22.57it/s]



306it [00:08, 34.22it/s]



607it [00:14, 49.93it/s]



907it [00:21, 35.10it/s]



1208it [00:29, 52.84it/s]



1509it [00:35, 52.32it/s]



1803it [00:42, 29.37it/s]



1921it [00:46, 41.63it/s]

====> Epoch: 5 Average loss: 0.0431
Training ...



6it [00:00, 27.90it/s]



311it [00:06, 50.27it/s]



607it [00:13, 34.00it/s]



909it [00:20, 50.39it/s]



1211it [00:26, 57.99it/s]



1505it [00:34, 29.71it/s]



1810it [00:41, 54.11it/s]



1921it [00:43, 43.96it/s]

====> Epoch: 6 Average loss: 0.0434
Training ...



6it [00:00, 29.39it/s]



307it [00:07, 33.32it/s]



610it [00:14, 54.11it/s]



909it [00:20, 52.09it/s]



1204it [00:28, 34.95it/s]



1507it [00:34, 52.89it/s]



1806it [00:40, 44.27it/s]



1921it [00:44, 43.35it/s]

====> Epoch: 7 Average loss: 0.0432
Training ...



5it [00:00, 18.62it/s]



310it [00:07, 55.65it/s]



608it [00:13, 54.07it/s]



905it [00:21, 37.19it/s]



1208it [00:27, 55.52it/s]



1507it [00:33, 37.81it/s]



1809it [00:41, 51.88it/s]



1921it [00:44, 43.52it/s]

====> Epoch: 8 Average loss: 0.0433
Training ...



7it [00:00, 33.47it/s]



304it [00:06, 44.87it/s]



612it [00:15, 53.52it/s]



910it [00:20, 54.71it/s]



1204it [00:27, 33.19it/s]



1510it [00:35, 53.23it/s]



1808it [00:40, 51.62it/s]



1921it [00:43, 43.76it/s]

====> Epoch: 9 Average loss: 0.0431
Training ...



2it [00:00, 10.57it/s]



307it [00:07, 51.65it/s]



606it [00:13, 53.50it/s]



908it [00:21, 34.89it/s]



1207it [00:28, 53.85it/s]



1504it [00:34, 34.62it/s]



1811it [00:42, 56.00it/s]



1921it [00:45, 42.59it/s]

====> Epoch: 10 Average loss: 0.0432
Training ...



5it [00:00, 24.45it/s]



307it [00:05, 51.73it/s]



605it [00:14, 32.76it/s]



908it [00:20, 56.36it/s]



1207it [00:26, 35.29it/s]



1507it [00:35, 54.47it/s]



1809it [00:41, 50.21it/s]



1921it [00:43, 44.38it/s]

====> Epoch: 11 Average loss: 0.0436
Training ...



8it [00:00, 37.05it/s]



308it [00:08, 36.90it/s]



608it [00:15, 51.99it/s]



904it [00:21, 32.19it/s]



1210it [00:29, 51.90it/s]



1509it [00:35, 52.46it/s]



1805it [00:42, 38.23it/s]



1921it [00:46, 41.68it/s]

====> Epoch: 12 Average loss: 0.0432
Training ...



3it [00:00, 13.02it/s]



311it [00:06, 54.28it/s]



605it [00:12, 35.32it/s]



911it [00:20, 52.43it/s]



1212it [00:26, 55.75it/s]



1504it [00:33, 34.84it/s]



1811it [00:41, 52.32it/s]



1921it [00:43, 44.10it/s]

====> Epoch: 13 Average loss: 0.0427
Training ...



6it [00:00, 32.62it/s]



308it [00:07, 36.60it/s]



608it [00:15, 52.15it/s]



911it [00:20, 52.36it/s]



1206it [00:28, 35.24it/s]



1506it [00:35, 51.87it/s]



1804it [00:41, 45.06it/s]



1921it [00:44, 43.06it/s]


====> Epoch: 14 Average loss: 0.0425
remove 1000 uncertain samples from du
Evaluation ...


625it [00:13, 46.77it/s]

Iteration: 22, len(dl): 30731, len(du): 31000, len(dh) 0, acc: 91.38 
Iteration: 23: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



1938it [00:46, 41.36it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 31731, len(du) 31000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 31731, len(du) 31000
Iteration: 23 fine-tune the model on dh U dl
Training ...



6it [00:00, 31.13it/s]



309it [00:05, 53.18it/s]



605it [00:13, 32.25it/s]



908it [00:20, 54.10it/s]



1207it [00:26, 52.58it/s]



1505it [00:34, 36.18it/s]



1810it [00:40, 52.81it/s]



1984it [00:44, 44.76it/s]

====> Epoch: 0 Average loss: 0.0428
Training ...



7it [00:00, 33.25it/s]



306it [00:09, 34.89it/s]



611it [00:14, 51.00it/s]



908it [00:21, 34.36it/s]



1210it [00:29, 54.35it/s]



1507it [00:35, 54.04it/s]



1808it [00:43, 34.68it/s]



1984it [00:47, 41.57it/s]

====> Epoch: 1 Average loss: 0.0427
Training ...



5it [00:00, 25.36it/s]



311it [00:06, 52.14it/s]



607it [00:14, 36.50it/s]



912it [00:20, 55.35it/s]



1206it [00:26, 53.49it/s]



1505it [00:35, 33.28it/s]



1811it [00:41, 49.57it/s]



1984it [00:44, 44.42it/s]

====> Epoch: 2 Average loss: 0.0427
Training ...



8it [00:00, 34.69it/s]



309it [00:09, 46.52it/s]



609it [00:14, 52.25it/s]



907it [00:22, 33.98it/s]



1213it [00:29, 55.26it/s]



1513it [00:35, 52.74it/s]



1805it [00:43, 34.73it/s]



1984it [00:47, 41.90it/s]

====> Epoch: 3 Average loss: 0.0423
Training ...



7it [00:00, 30.67it/s]



308it [00:06, 52.96it/s]



608it [00:14, 34.48it/s]



908it [00:20, 52.83it/s]



1210it [00:26, 52.55it/s]



1505it [00:35, 31.26it/s]



1807it [00:41, 54.41it/s]



1984it [00:45, 43.98it/s]

====> Epoch: 4 Average loss: 0.0424
Training ...



6it [00:00, 29.95it/s]



307it [00:08, 32.81it/s]



610it [00:14, 52.15it/s]



908it [00:21, 37.27it/s]



1209it [00:29, 52.51it/s]



1508it [00:35, 54.45it/s]



1805it [00:42, 38.18it/s]



1984it [00:47, 41.87it/s]

====> Epoch: 5 Average loss: 0.0428
Training ...



8it [00:00, 35.84it/s]



308it [00:06, 57.11it/s]



605it [00:13, 37.31it/s]



906it [00:20, 54.10it/s]



1212it [00:26, 51.90it/s]



1505it [00:34, 35.30it/s]



1811it [00:41, 53.82it/s]



1984it [00:44, 44.58it/s]

====> Epoch: 6 Average loss: 0.0424
Training ...



6it [00:00, 29.90it/s]



304it [00:08, 34.89it/s]



605it [00:15, 49.80it/s]



902it [00:20, 42.67it/s]



1212it [00:29, 52.02it/s]



1508it [00:35, 52.81it/s]



1805it [00:42, 35.72it/s]



1984it [00:48, 41.23it/s]

====> Epoch: 7 Average loss: 0.0427
Training ...



9it [00:00, 43.41it/s]



307it [00:06, 50.33it/s]



605it [00:12, 35.42it/s]



907it [00:20, 50.56it/s]



1208it [00:26, 54.42it/s]



1508it [00:34, 36.11it/s]



1812it [00:41, 53.09it/s]



1984it [00:44, 44.37it/s]

====> Epoch: 8 Average loss: 0.0423
Training ...



7it [00:00, 33.61it/s]



305it [00:07, 35.53it/s]



611it [00:14, 52.95it/s]



906it [00:20, 35.72it/s]



1207it [00:28, 39.35it/s]



1508it [00:35, 53.94it/s]



1805it [00:41, 33.08it/s]



1984it [00:46, 42.36it/s]

====> Epoch: 9 Average loss: 0.0422
Training ...



5it [00:00, 23.91it/s]



311it [00:06, 54.01it/s]



606it [00:13, 36.16it/s]



910it [00:21, 51.25it/s]



1207it [00:27, 51.49it/s]



1505it [00:34, 32.89it/s]



1811it [00:42, 52.74it/s]



1984it [00:45, 43.59it/s]

====> Epoch: 10 Average loss: 0.0428
Training ...



5it [00:00, 25.61it/s]



307it [00:07, 40.44it/s]



611it [00:15, 54.71it/s]



907it [00:21, 50.87it/s]



1208it [00:29, 34.86it/s]



1509it [00:36, 47.69it/s]



1807it [00:42, 33.32it/s]



1984it [00:48, 41.32it/s]

====> Epoch: 11 Average loss: 0.0436
Training ...



4it [00:00, 14.81it/s]



307it [00:06, 52.35it/s]



608it [00:13, 34.70it/s]



906it [00:22, 49.78it/s]



1210it [00:28, 53.53it/s]



1508it [00:35, 34.96it/s]



1811it [00:43, 50.72it/s]



1984it [00:47, 41.97it/s]

====> Epoch: 12 Average loss: 0.0431
Training ...



7it [00:00, 36.92it/s]



309it [00:07, 39.00it/s]



609it [00:15, 55.97it/s]



908it [00:21, 37.28it/s]



1207it [00:29, 36.44it/s]



1510it [00:35, 55.12it/s]



1806it [00:42, 31.54it/s]



1984it [00:47, 41.88it/s]

====> Epoch: 13 Average loss: 0.0420
Training ...



4it [00:00, 18.49it/s]



307it [00:06, 49.59it/s]



606it [00:13, 35.59it/s]



910it [00:21, 51.75it/s]



1211it [00:27, 53.61it/s]



1507it [00:35, 35.36it/s]



1812it [00:42, 51.89it/s]



1984it [00:46, 42.99it/s]


====> Epoch: 14 Average loss: 0.0421
remove 1000 uncertain samples from du
Evaluation ...


625it [00:15, 40.90it/s]

Iteration: 23, len(dl): 31731, len(du): 30000, len(dh) 0, acc: 87.61 
Iteration: 24: run prediction on unlabeled data `du` 
Prediction on Unlabelled Data ...



1875it [00:43, 43.42it/s]

Update size of `dl`  and `du` by adding uncertain 1000 samples in `dl` len(dl): 32731, len(du) 30000
Update size of `dl`  and `du` by adding 0 hcs samples in `dl` len(dl): 32731, len(du) 30000
Iteration: 24 fine-tune the model on dh U dl
Training ...



6it [00:00, 25.65it/s]



305it [00:09, 36.86it/s]



611it [00:15, 54.41it/s]



907it [00:22, 31.92it/s]



1207it [00:30, 52.08it/s]



1507it [00:35, 54.84it/s]



1807it [00:43, 35.94it/s]



2046it [00:49, 41.36it/s]

====> Epoch: 0 Average loss: 0.0422
Training ...



7it [00:00, 34.50it/s]



310it [00:06, 50.18it/s]



605it [00:14, 30.30it/s]



909it [00:21, 52.23it/s]



1205it [00:27, 40.84it/s]



1507it [00:36, 51.43it/s]



1812it [00:42, 53.85it/s]



2046it [00:47, 42.96it/s]

====> Epoch: 1 Average loss: 0.0421
Training ...



4it [00:00, 14.72it/s]



309it [00:08, 51.50it/s]



608it [00:14, 44.18it/s]



905it [00:22, 32.49it/s]



1211it [00:29, 50.75it/s]



1505it [00:35, 34.62it/s]



1811it [00:44, 53.71it/s]



2046it [00:48, 41.87it/s]

====> Epoch: 2 Average loss: 0.0424
Training ...



4it [00:00, 18.76it/s]



305it [00:07, 35.26it/s]



606it [00:15, 52.67it/s]



909it [00:20, 53.69it/s]



1206it [00:28, 33.37it/s]



1506it [00:35, 52.13it/s]



1808it [00:42, 52.15it/s]



2046it [00:49, 41.68it/s]

====> Epoch: 3 Average loss: 0.0424
Training ...



5it [00:00, 16.93it/s]



307it [00:06, 52.49it/s]



604it [00:13, 33.28it/s]



910it [00:21, 54.96it/s]



1206it [00:27, 46.49it/s]



1507it [00:35, 30.88it/s]



1811it [00:42, 53.85it/s]



2046it [00:47, 43.19it/s]

====> Epoch: 4 Average loss: 0.0430
Training ...



6it [00:00, 32.25it/s]



308it [00:08, 34.49it/s]



608it [00:15, 53.39it/s]



906it [00:21, 38.97it/s]



1209it [00:30, 48.73it/s]



1508it [00:36, 36.31it/s]



1808it [00:43, 35.21it/s]



2046it [00:50, 40.85it/s]

====> Epoch: 5 Average loss: 0.0422
Training ...



6it [00:00, 27.83it/s]



312it [00:06, 53.56it/s]



605it [00:13, 34.53it/s]



910it [00:20, 45.55it/s]



1207it [00:26, 51.05it/s]



1507it [00:35, 30.68it/s]



1806it [00:41, 52.68it/s]



2046it [00:46, 44.16it/s]

====> Epoch: 6 Average loss: 0.0420
Training ...



4it [00:00, 20.15it/s]



311it [00:09, 47.72it/s]



607it [00:15, 50.11it/s]



905it [00:22, 32.10it/s]



1208it [00:30, 48.50it/s]



1508it [00:36, 52.47it/s]



1805it [00:44, 36.69it/s]



2046it [00:50, 40.88it/s]

====> Epoch: 7 Average loss: 0.0422
Training ...



7it [00:00, 32.72it/s]



309it [00:05, 52.51it/s]



608it [00:14, 34.03it/s]



907it [00:20, 53.61it/s]



1207it [00:27, 35.23it/s]



1511it [00:36, 45.74it/s]



1808it [00:41, 52.69it/s]



2046it [00:47, 42.81it/s]

====> Epoch: 8 Average loss: 0.0423
Training ...



3it [00:00, 11.82it/s]



306it [00:07, 53.74it/s]



607it [00:13, 56.84it/s]



906it [00:21, 34.79it/s]



1207it [00:28, 52.69it/s]



1503it [00:35, 30.40it/s]



1812it [00:43, 54.31it/s]



2046it [00:48, 42.29it/s]

====> Epoch: 9 Average loss: 0.0423
Training ...



3it [00:00, 20.74it/s]



304it [00:07, 34.11it/s]



611it [00:15, 56.93it/s]



913it [00:20, 57.86it/s]



1207it [00:29, 32.93it/s]



1512it [00:35, 54.21it/s]



1808it [00:42, 35.64it/s]



2046it [00:49, 41.40it/s]

====> Epoch: 10 Average loss: 0.0420
Training ...



4it [00:00, 17.92it/s]



310it [00:06, 51.88it/s]



603it [00:13, 32.15it/s]



911it [00:21, 52.34it/s]



1213it [00:27, 54.87it/s]



1507it [00:35, 32.15it/s]



1807it [00:42, 51.03it/s]



2046it [00:46, 43.55it/s]


====> Epoch: 11 Average loss: 0.0426
Training ...


5it [00:00, 27.49it/s]



305it [00:09, 34.62it/s]



607it [00:15, 53.33it/s]



904it [00:21, 41.76it/s]



1212it [00:30, 52.27it/s]



1510it [00:36, 52.91it/s]



1805it [00:43, 32.64it/s]



2046it [00:49, 41.27it/s]

====> Epoch: 12 Average loss: 0.0419
Training ...



5it [00:00, 24.87it/s]



310it [00:06, 51.65it/s]



607it [00:14, 34.35it/s]



909it [00:21, 53.44it/s]



1207it [00:27, 37.36it/s]



1509it [00:36, 42.02it/s]



1808it [00:42, 53.53it/s]



2046it [00:47, 42.85it/s]

====> Epoch: 13 Average loss: 0.0426
Training ...



5it [00:00, 19.29it/s]



306it [00:08, 47.33it/s]



606it [00:13, 52.54it/s]



905it [00:22, 32.16it/s]



1211it [00:29, 53.07it/s]



1505it [00:35, 34.88it/s]



1809it [00:43, 49.42it/s]



2046it [00:48, 41.94it/s]


====> Epoch: 14 Average loss: 0.0421
remove 1000 uncertain samples from du
Evaluation ...


625it [00:15, 40.12it/s]

Iteration: 24, len(dl): 32731, len(du): 29000, len(dh) 0, acc: 91.35 





In [None]:
len(dataset_train)

42000