In [1]:
"""
Boilerplate to implement training different networks on different datasets
with varying config.

I wish a machine could automate setting up decent baseline models and datasets
"""
#  import json
import os
from os.path import exists
import pampy
from simple_parsing import ArgumentParser, choice
from simplepytorch import datasets as D
from simplepytorch import trainlib as TL
from simplepytorch import metrics
from sklearn.model_selection import StratifiedShuffleSplit
from torch.utils.data import Dataset, DataLoader
from typing import Union, Optional
import dataclasses as dc
import numpy as np
import torch as T
import torchvision.transforms as tvt

from deepfix.models import get_effnetv2, get_resnet, get_efficientnetv1, get_DeepFixEnd2End, DeepFixMLP
from deepfix.models.ghaarconv import convert_conv2d_to_gHaarConv2d
from deepfix.init_from_distribution import init_from_beta, reset_optimizer
from deepfix import deepfix_strategies as dfs
import pytorch_wavelets as pyw



In [2]:
# Registry of model constructors, consulted through `match(model_spec, MODELS)`.
# A key is a pattern: the model name followed by one `str` placeholder for each
# remaining ':'-separated field of the spec.  The paired lambda receives those
# fields as strings (hence the int(...) conversions) and builds the network.
# Nothing is constructed until a lambda is actually called.
MODELS = {
    ('effnetv2', str, str, str): (
        lambda weights, n_in, n_out: get_effnetv2(
            weights, int(n_in), int(n_out))),
    ('resnet50', str, str, str): (
        lambda weights, n_in, n_out: get_resnet(
            'resnet50', weights, int(n_in), int(n_out))),
    ('resnet18', str, str, str): (
        lambda weights, n_in, n_out: get_resnet(
            'resnet18', weights, int(n_in), int(n_out))),
    ('efficientnet-b0', str, str, str): (
        lambda weights, n_in, n_out: get_efficientnetv1(
            'efficientnet-b0', weights, int(n_in), int(n_out))),
    ('efficientnet-b1', str, str, str): (
        lambda weights, n_in, n_out: get_efficientnetv1(
            'efficientnet-b1', weights, int(n_in), int(n_out))),
    # ResNet-18 fed with a tiled wavelet-coefficient image (class `R`).
    ('waveletres18', str, str, str): (
        lambda weights, n_in, n_out: R(weights, int(n_in), int(n_out))),
    # Field order of the spec:
    #   waveletmlp:mlp_channels:in_ch:out_ch:wavelet_levels:patch_size:in_ch_mul:mlp_depth
    ('waveletmlp', str, str, str, str, str, str, str): (
        lambda width, n_in, n_out, levels, patch, in_mul, depth: get_DeepFixEnd2End(
            int(n_in), int(n_out),
            in_ch_multiplier=int(in_mul), wavelet='db1',
            wavelet_levels=int(levels), wavelet_patch_size=int(patch),
            mlp_depth=int(depth), mlp_channels=int(width),
            mlp_fix_weights='none', mlp_activation=None)
        ),

    # Disabled experiment, kept for reference:
    #  ('waveletres18v2', str, str, str): lambda pretrain, in_ch, out_ch: (
        #  DeepFixCompression(levels=8, wavelet='coif1', patch_size=1),
        #  R2(pretrain, int(in_ch), int(out_ch))),
}


class R(T.nn.Module):
    """ResNet-18 that consumes a wavelet-coefficient image instead of raw pixels.

    The input is passed through `pyw.DWT(J=8, wave='coif1', mode='zero')`, the
    resulting approximation and detail coefficients are tiled into one image
    by `wavelet_coefficients_as_tensorimage`, and that image is fed to the
    ResNet built by `get_resnet('resnet18', ...)`.
    """
    def __init__(self, pretrain, in_ch, out_ch):
        super().__init__()
        self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)
        self.dwt = pyw.DWT(J=8, wave='coif1', mode='zero')

    @staticmethod
    def wavelet_coefficients_as_tensorimage(approx, detail, normalize=False):
        """Tile DWT coefficients into a single image tensor.

        Args:
            approx: approximation coefficients; must have at least 2 leading
                dims followed by (height, width).
            detail: sequence of detail tensors whose dim -3 holds the three
                bands (lh, hl, hh).  `detail[0]` fixes the output size: twice
                its height and width.
            normalize: if True, each detail band is divided by its largest
                absolute extreme so values land in [-1, +1] with sign kept.
                The approximation is never normalized.
        Returns:
            Tensor shaped `approx.shape[:-2] + (2*h0, 2*w0)`: approx in the
            top-left corner, and for every level lh to the right, hl below
            and hh on the diagonal of the (h, w) corner block.
        """
        _batch, _channels = approx.shape[:2]  # requires >= 2 leading dims
        leading_dims = approx.shape[:-2]  # num images in minibatch, num channels, etc
        finest = detail[0]
        canvas = T.zeros(
            leading_dims + (finest.shape[-2]*2, finest.shape[-1]*2),
            device=approx.device, dtype=approx.dtype)

        def _scale_to_pm1(x):
            # into [-1,+1] preserving sign
            return x / max(x.min()*-1, x.max())

        approx_h, approx_w = approx.shape[-2], approx.shape[-1]
        canvas[..., :approx_h, :approx_w] = approx
        for bands in detail:
            horizontal, vertical, diagonal = bands.unbind(-3)
            h, w = horizontal.shape[-2:]
            if normalize:
                horizontal, vertical, diagonal = [
                    _scale_to_pm1(band)
                    for band in (horizontal, vertical, diagonal)]
            canvas[..., :h, w:2*w] = horizontal
            canvas[..., h:2*h, :w] = vertical
            canvas[..., h:2*h, w:2*w] = diagonal
        return canvas

    def forward(self, x):
        approx, detail = self.dwt(x)
        coeff_image = self.wavelet_coefficients_as_tensorimage(approx, detail)
        return self.r(coeff_image)


class R2(T.nn.Module):
    """ResNet-18 wrapper for 3-D inputs.

    `forward` expects a tensor with exactly three dims, appends a fourth dim
    and repeats the data along it as many times as the size of the third dim,
    then passes the result to the ResNet.
    """
    def __init__(self, pretrain, in_ch, out_ch):
        super().__init__()
        self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)

    def forward(self, x):
        _batch, _channels, height = x.shape  # fails unless x is 3-D
        tiled = x.unsqueeze(-1).repeat(1, 1, 1, height)
        return self.r(tiled)


class LossCheXpertIdentity(T.nn.Module):
    """Binary cross entropy against a one-hot encoding of `y % N`.

    Integer identity labels are hashed into N bins via modulo, one-hot encoded,
    and compared with the model's N logits using `BCEWithLogitsLoss`.

    Args:
        N: number of bins, which must equal the number of model outputs.
    """
    def __init__(self, N):
        super().__init__()
        self.bce = T.nn.BCEWithLogitsLoss()
        self.N = N

    def forward(self, yhat, y):
        """Compute the loss.

        Args:
            yhat: logits of shape (B, N).
            y: integer identity labels of shape (B, 1) or (B,).
        Returns:
            Scalar loss averaged over all B*N predictions.
        """
        # absolute max possible num patients in chexpert is 223414
        # but let's just hash them into a smaller number of bins via modulo N
        assert self.N == yhat.shape[1], \
                f'note: model must have {self.N} binary predictions per sample'
        # scatter_ needs a 2-D index; this also accepts a flat (B,) label vector
        bins = y.long().reshape(y.shape[0], -1) % self.N
        y_onehot = y.new_zeros(y.shape[0], self.N, dtype=yhat.dtype
                               ).scatter_(1, bins, 1)
        # Score every bin.  The previous code compared only the last column
        # (yhat[:, -1]), so the other N-1 outputs received no training signal.
        return self.bce(yhat, y_onehot)


class LossCheXpertUignore(T.nn.Module):
    """BCE-with-logits loss that skips entries whose label equals 2.

    The value 2 marks an uncertainty label; those entries contribute nothing
    to the loss.
    """
    def __init__(self):
        super().__init__()
        self.bce = T.nn.BCEWithLogitsLoss()

    def forward(self, yhat, y):
        """Compute the loss over the entries where `y != 2`.

        Args:
            yhat: logits, same shape as `y`.
            y: float targets where the value 2 means "ignore this entry".
        Returns:
            Scalar mean BCE over the kept entries, or a zero that stays
            connected to `yhat` when every entry is ignored.
        """
        keep = (y != 2)  # True where the label is NOT an uncertainty label
        if not keep.any():
            # The mean over an empty selection is NaN, which would poison the
            # optimizer state.  Return a zero that still supports backward().
            return yhat.sum() * 0
        return self.bce(yhat[keep], y[keep])


def loss_intelmobileodt(yhat, y):
    """Cross-entropy loss with class balancing weights.

    Not sure this actually helps

    because Type 2 is the hardest class, it
    has the most samples, and it separates Type 1 from Type 3.  Arguably, Type 2
    samples are on the decision boundary between Type 1 and 3.
    Class balancing weights make it harder to focus on class 2.

    Args:
        yhat: logits of shape (B, 3).
        y: targets accepted by `torch.nn.functional.cross_entropy`
            (the dataset in this file yields integer class indices).
    Returns:
        Scalar weighted cross-entropy loss.
    """
    # class distribution of stage='train'
    class_counts = T.tensor([249, 781, 450], dtype=yhat.dtype, device=yhat.device)
    # cross_entropy requires a 1-D weight with one entry per class, in the
    # dtype of the logits.  The previous code reshaped it to (1, 3) and derived
    # the dtype from the integer targets.
    w = class_counts.max() / class_counts
    return T.nn.functional.cross_entropy(yhat, y, weight=w)
    # can't apply focal loss unless do it manually.


def onehot(y, nclasses):
    """One-hot encode a 1-D tensor of integer class indices.

    Args:
        y: 1-D integer tensor of class indices in [0, nclasses).
        nclasses: number of columns in the result.
    Returns:
        Tensor of shape (y.numel(), nclasses) with the dtype and device of
        `y`, holding 1 at column y[i] of row i and 0 elsewhere.
    """
    encoded = y.new_zeros((y.numel(), nclasses))
    column_index = y.unsqueeze(1)
    encoded.scatter_(1, column_index, 1)
    return encoded


def _upsample_pad_minibatch_imgs_to_same_size(batch, target_is_segmentation_mask=False):
    """Collate function for a dataloader of (x, y) samples with varying image size.

    Every image (shape (C, H, W)) is zero-padded, roughly centred, up to the
    largest height and width found in the batch, then the images are stacked.

    Args:
        batch: sequence of samples; sample[0] is the image tensor and
            sample[1] the target tensor.
        target_is_segmentation_mask: if True, the target receives the same
            padding as its image; otherwise it is stacked unchanged.
    Returns:
        (X, Y): the stacked padded images and the stacked targets.
    """
    shapes = [sample[0].shape for sample in batch]
    max_h = max(h for _, h, _ in shapes)
    max_w = max(w for _, _, w in shapes)

    images, targets = [], []
    for sample in batch:
        img_h, img_w = sample[0].shape[1:]
        extra_h, extra_w = max_h - img_h, max_w - img_w
        left, top = extra_w // 2, extra_h // 2
        # F.pad order for the last two dims: (left, right, top, bottom)
        pad_spec = (left, extra_w - left, top, extra_h - top)
        images.append(T.nn.functional.pad(sample[0], pad_spec))
        targets.append(
            T.nn.functional.pad(sample[1], pad_spec)
            if target_is_segmentation_mask else sample[1])
    return T.stack(images), T.stack(targets)


def get_dset_chexpert(train_frac=.8, val_frac=.2, small=False,
                      labels:str='diagnostic', num_identities=None,
                      dataset_dir:str="../data/CheXpert-v1.0-small/",
                      batch_size:int=15):
    """Build CheXpert train/val/test datasets and their data loaders.

    Args:
        train_frac:  fraction of the official training set used for training.
        val_frac:  fraction of the official training set used for validation.
            If train_frac + val_frac is 1, training gets everything that is
            not in the validation split; otherwise the remainder is discarded.
        labels:  either "diagnostic" (the 14 classes defined as
            D.CheXpert.LABELS_DIAGNOSTIC) or "identity" ("patient", "study",
            "view", "index")
        small:  whether to use CheXpert_Small dataset (previously downsampled
            images) or the fully size dataset.
        num_identities:  used only if labels='identity'.  If
            num_identities=1000, then all patients get identified as coming
            from precisely 1 of 1000 bins.
        dataset_dir:  directory handed to the dataset class.
            NOTE(review): the default points at the "small" directory even
            when small=False -- confirm this is intended.
        batch_size:  minibatch size of all three data loaders.

    Returns:
        (
        {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
         'train_loader': ..., 'val_loader': ..., 'test_loader': ...
         },

        ('Pneumonia', 'Cardiomegaly', ...)  # class names defined by `labels`
        )

    Raises:
        NotImplementedError: if `labels` is not "diagnostic" or "identity".
    """
    import copy  # local import keeps this block self-contained

    # Copy the per-label mappings too.  A plain dict(...) copy shares the inner
    # dicts, so the NaN remap below used to mutate the class-level constant
    # D.CheXpert.LABEL_CLEANUP_DICT for every later caller.
    _label_cleanup_dct = {
        k: copy.copy(v)
        for k, v in dict(D.CheXpert.LABEL_CLEANUP_DICT).items()}
    if labels == 'diagnostic':
        class_names = D.CheXpert.LABELS_DIAGNOSTIC
        for k in class_names:
            _label_cleanup_dct[k][np.nan] = 0  # remap missing value to negative
        get_ylabels = lambda dct: \
                D.CheXpert.format_labels(dct, labels=class_names).float()
    elif labels == 'identity':
        class_names = list(range(num_identities))
        get_ylabels = lambda dct: \
                (D.CheXpert.format_labels(dct, labels=['index']) % num_identities).long()
    else:
        raise NotImplementedError(f"unrecognized labels: {labels}")
    kws = dict(
        img_transform=tvt.Compose([
#              tvt.RandomCrop((512, 512)),
            tvt.ToTensor(),  # full res 1024x1024 imgs
        ]),
        getitem_transform=lambda dct: (dct['image'], get_ylabels(dct)),
        label_cleanup_dct=_label_cleanup_dct,
    )
    if small:
        kls = D.CheXpert_Small
    else:
        kls = D.CheXpert

    train_dset = kls(dataset_dir=dataset_dir, use_train_set=True, **kws)

    N = len(train_dset)
    # Tolerant comparison: e.g. .7 + .3 is not exactly 1 in floating point.
    if abs(train_frac + val_frac - 1) < 1e-9:
        nsplits = [N - int(N*val_frac), int(N*val_frac), 0]
    else:
        a,b = int(N*train_frac), int(N*val_frac)
        nsplits = [a,b, N-a-b]
    train_dset, val_dset, _ = T.utils.data.random_split(train_dset, nsplits)
    test_dset = kls(dataset_dir=dataset_dir, use_train_set=False, **kws)
    batch_dct = dict(
        batch_size=batch_size, collate_fn=_upsample_pad_minibatch_imgs_to_same_size,
        num_workers=int(os.environ.get("num_workers", 4)))  # upsample pad must take time
    train_loader=DataLoader(train_dset, shuffle=True, **batch_dct)
    val_loader=DataLoader(val_dset, **batch_dct)
    test_loader=DataLoader(test_dset, **batch_dct)
    return (dict(
        train_dset=train_dset, val_dset=val_dset, test_dset=test_dset,
        train_loader=train_loader, val_loader=val_loader, test_loader=test_loader,
    ), class_names)


def get_dset_intel_mobileodt(stage_trainval:str, use_val:str, stage_test:str, augment:str
                             ) -> (dict[str,Optional[Union[Dataset,DataLoader]]], tuple[str]):
    """Obtain train/val/test splits for the IntelMobileODT Cervical Cancer
    Colposcopy dataset, and the data loaders.

    Args:
        stage_trainval: the `stage` for training and validation.
            i.e. Possible choices:  {'train', 'train+additional'}
            Train / val split is 70/30 random stratified split.
        use_val: Whether to create a validation set
            Choices:  {"val", "noval"}
        stage_test: the `stage` for test set.  Should be "test".
        augment: Type of augmentations to apply.  One of {'v1', }.
            "v1" - make the aspect ratio .75, resize images to (200,150), and convert in range [0,1]
            (the resize is assumed to have been applied to the stored images
            already; at load time only the division by 255 happens here).
    Returns:
        (
        {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
         'train_loader': ..., 'val_loader': ..., 'test_loader': ...
         },

        ('Type 1', 'Type 2', 'Type 3')
        )
        With use_val="noval" both 'val_dset' and 'val_loader' are None.
    """
    assert augment == 'v1', 'code bug: other augmentations not implemented'
    base_dir = './data/intel_mobileodt_cervical_resized'
    dset_trainval = D.IntelMobileODTCervical(stage_trainval, base_dir)
    dct = {'test_dset': D.IntelMobileODTCervical(stage_test, base_dir)}
    if use_val == 'noval':
        dct['train_dset'] = dset_trainval
        dct['val_dset'] = None
    else:
        assert use_val == 'val', f'unrecognized option: {use_val}'
        # labels are only needed for the stratified split, so fetch them here
        _y = [dset_trainval.getitem(i, load_img=False)
              for i in range(len(dset_trainval))]
        idxs_train, idxs_val = list(
            StratifiedShuffleSplit(1, test_size=.3).split(
                np.arange(len(dset_trainval)), _y))[0]
        dct['train_dset'] = T.utils.data.Subset(dset_trainval, idxs_train)
        dct['val_dset'] = T.utils.data.Subset(dset_trainval, idxs_val)

    # preprocess train/val/test images all the same way
    preprocess_v1 = tvt.Compose([
        #
        ### previously done (to save computation time) ###
        #  D.IntelMobileODTCervical.fix_aspect_ratio,
        #  tvt.Resize((200, 150)),  # interpolation=tvt.InterpolationMode.NEAREST),
        #
        lambda x: x.float()/255.
    ])

    def _preprocess_sample(xy):
        # image -> float in [0,1]; label shifted down by one and cast to long
        #  onehot(xy[1].unsqueeze(0).long()-1, 3).squeeze_().float()))
        return (preprocess_v1(xy[0]), xy[1].long()-1)

    # Leave a missing validation set as None.  Wrapping None in PreProcess
    # made the `is None` test below always fail, so a DataLoader was built
    # around a dataset that does not exist.
    dct = {k: (None if v is None else D.PreProcess(v, _preprocess_sample))
           for k,v in dct.items()}
    dct.update(dict(
        train_loader=DataLoader(dct['train_dset'], batch_size=20, shuffle=True),
        test_loader=DataLoader(dct['test_dset'], batch_size=20),))
    if dct['val_dset'] is None:
        dct['val_loader'] = None
    else:
        dct['val_loader'] = DataLoader(dct['val_dset'], batch_size=20)
    class_names = [x.replace('_', ' ') for x in D.IntelMobileODTCervical.LABEL_NAMES]
    return dct, class_names


# Registry of loss constructors, consulted through `match(loss_spec, LOSS_FNS)`.
# Keys are patterns over the ':'-separated loss spec.  The single-name entries
# take one positional argument and ignore it (presumably pampy hands over the
# matched spec when a pattern captures nothing -- confirm against pampy).
# 'chexpert_identity:N' receives N as a string.
LOSS_FNS = {
    ('BCEWithLogitsLoss', ): lambda _spec: T.nn.BCEWithLogitsLoss(),
    ('CrossEntropyLoss', ): lambda _spec: T.nn.CrossEntropyLoss(),
    ('CE_intelmobileodt', ): lambda _spec: loss_intelmobileodt,
    ('chexpert_uignore', ): lambda _spec: LossCheXpertUignore(),
    ('chexpert_identity', str): (
        lambda num_bins: LossCheXpertIdentity(N=int(num_bins))),
}

# Registry of dataset builders, consulted through `match(dset_spec, DSETS)`.
# Keys are patterns over the ':'-separated dataset spec; every captured field
# arrives as a string and is converted inside the lambda where needed.
DSETS = {
    # intel_mobileodt:<stage_trainval>:<val|noval>:<stage_test>:<augment>
    ('intel_mobileodt', str, str, str, str): (
        lambda stage_trainval, use_val, stage_test, augment:
            get_dset_intel_mobileodt(stage_trainval, use_val, stage_test, augment)),
    #  ('origa', ... todo): ( lambda ...: get_dset_origa(...)
    #  ('riga', ... todo): ( lambda ...: get_dset_riga(...)
    # chexpert:<train_frac>:<val_frac>  (full-size images)
    ('chexpert', str, str): (
        lambda frac_train, frac_val: get_dset_chexpert(
            float(frac_train), float(frac_val), small=False, labels='diagnostic')),
    # chexpert_small:<train_frac>:<val_frac>  (downsampled images)
    ('chexpert_small', str, str): (
        lambda frac_train, frac_val: get_dset_chexpert(
            float(frac_train), float(frac_val), small=True, labels='diagnostic')),
    # chexpert_small_ID:<num_identities>:<train_frac>:<val_frac>
    ('chexpert_small_ID', str, str, str): (
        lambda n_ids, frac_train, frac_val: get_dset_chexpert(
            float(frac_train), float(frac_val), small=True,
            labels='identity', num_identities=int(n_ids))),
}


def match(spec:str, dct:dict):
    """Dispatch a ':'-separated spec string against a registry of patterns.

    Args:
        spec: e.g. "resnet18:imagenet:3:3"; it is split on ':' before matching.
        dct: maps a pampy pattern to the action for that pattern.
    Returns:
        Whatever `pampy.match` returns for the first matching pattern.
    """
    fields = spec.split(':')
    # pampy.match expects (value, pattern1, action1, pattern2, action2, ...)
    flat_pairs = []
    for pattern, action in dct.items():
        flat_pairs.append(pattern)
        flat_pairs.append(action)
    return pampy.match(fields, *flat_pairs)


def get_model_opt_loss(
        model_spec:str, opt_spec:str, loss_spec:str, regularizer_spec:str,
        device:str) -> dict[str, Union[T.nn.Module, T.optim.Optimizer]]:
    """Create the model, its optimizer and the loss function from spec strings.

    Args:
        model_spec: a string resolved through the MODELS registry, typically
            "model_name:pretraining:in_channels:out_classes".  For example:
            "effnetv2:untrained:1:5"
        opt_spec: Specifies how to create optimizer; passed to
            `reset_optimizer` together with the model.
            Example: "SGD:lr=.003:momentum=.9"
        loss_spec: a string resolved through the LOSS_FNS registry,
            e.g. "chexpert_uignore".
        regularizer_spec: 'none', or a spec understood by RegularizedLoss
            (e.g. "deepfixmlp:0.1"), in which case the loss gets wrapped.
        device: device the model is moved to, e.g. 'cpu' or 'cuda'
    Returns:
        dict with keys 'model', 'optimizer' and 'loss_fn'.
    """
    network = match(model_spec, MODELS).to(device, non_blocking=True)
    optimizer = reset_optimizer(opt_spec, network)
    criterion = match(loss_spec, LOSS_FNS)
    wants_regularizer = regularizer_spec != 'none'
    if wants_regularizer:
        criterion = RegularizedLoss(network, criterion, regularizer_spec)
    return {'model': network, 'optimizer': optimizer, 'loss_fn': criterion}


class RegularizedLoss(T.nn.Module):
    """Wrap a loss function so that a regularization term is added to it.

    Args:
        model: the model handed to the regularizer.
        lossfn: callable `(yhat, y) -> loss`.
        regularizer_spec: 'none' (adds 0) or 'deepfixmlp:X', which adds
            X * DeepFixMLP.get_VecAttn_regularizer(model).
    Raises:
        NotImplementedError: for any other regularizer_spec.
    """
    def __init__(self, model, lossfn, regularizer_spec:str):
        super().__init__()
        self.lossfn = lossfn
        self.regularizer_spec = regularizer_spec
        self.regularizer = self._make_regularizer(model, regularizer_spec)

    @staticmethod
    def _make_regularizer(model, spec):
        """Return a callable `(*args) -> penalty` for the given spec."""
        if spec == 'none':
            return lambda *_unused: 0
        if not spec.startswith('deepfixmlp:'):
            raise NotImplementedError(spec)
        lbda = float(spec.split(':')[1])
        # the penalty is re-evaluated on every call, i.e. on current weights
        return lambda *_unused: (
            lbda * DeepFixMLP.get_VecAttn_regularizer(model))

    def forward(self, yhat, y):
        data_term = self.lossfn(yhat, y)
        penalty = self.regularizer(yhat, y)
        return data_term + penalty

    def __repr__(self):
        return f'RegularizedLoss<{repr(self.lossfn)},{self.regularizer_spec}>'


def get_dset_loaders_resultfactory(dset_spec:str) -> dict:
    """Build the datasets and loaders for `dset_spec` and attach a result factory.

    Args:
        dset_spec: a string resolved through the DSETS registry,
            e.g. "chexpert_small:.01:.01".
    Returns:
        The dict produced by the dataset builder, extended with the key
        'result_factory': a zero-argument callable creating a fresh results
        object (multi-class for intel_mobileodt and chexpert_small_ID,
        multi-label for chexpert and chexpert_small).
    Raises:
        NotImplementedError: if no result factory is known for the spec.
    """
    dct, class_names = match(dset_spec, DSETS)

    def _multiclass_results():
        #  Alternative kept for reference:
        #  TL.MultiLabelBinaryClassification(
        #      class_names, binarize_fn=lambda yh: (T.sigmoid(yh)>.5).long())
        return TL.MultiClassClassification(
            len(class_names), binarize_fn=lambda yh: yh.softmax(1).argmax(1))

    def _multilabel_results():
        return CheXpertMultiLabelBinaryClassification(
            class_names, binarize_fn=lambda yh: (yh.sigmoid()>.5).long(), report_avg=True)

    if dset_spec.startswith(('intel_mobileodt:', 'chexpert_small_ID:')):
        dct['result_factory'] = _multiclass_results
    elif dset_spec.startswith(('chexpert:', 'chexpert_small:')):
        dct['result_factory'] = _multilabel_results
    else:
        raise NotImplementedError(f"I don't know how to create the result factory for {dset_spec}")
    return dct

class CheXpertMultiLabelBinaryClassification(TL.MultiLabelBinaryClassification):
    """Multi-label results tracker that leaves out labels equal to 2.

    Entries of `y` with value 2 (uncertainty labels) are excluded from the
    per-class confusion matrices.
    """
    def update(self, yhat, y, loss) -> None:
        """Accumulate one minibatch.

        Args:
            yhat: model outputs, shape (B, num_classes).
            y: targets of the same shape; the value 2 marks entries to skip.
            loss: scalar loss tensor for this minibatch.
        """
        self.num_samples += yhat.shape[0]
        self.loss += loss.item()
        assert yhat.shape == y.shape
        assert yhat.ndim == 2 and yhat.shape[1] == len(self._cms), "sanity check: model outputs expected prediction shape"
        predictions = self._binarize_fn(yhat)
        assert predictions.dtype == T.long, 'sanity check binarize fn'
        assert predictions.shape == y.shape, 'sanity check binarize fn'
        is_certain = y.ne(2)  # False wherever the label is an uncertainty label
        for column, cm in enumerate(self._cms.values()):
            keep = is_certain[:, column]
            if not keep.any():
                # don't update a confusion matrix if all data for this class is ignored
                continue
            batch_cm = metrics.confusion_matrix(
                y[keep, column], predictions[keep, column], num_classes=2)
            cm += batch_cm.cpu()


def get_deepfix_train_strategy(args:'TrainOptions'):
    """Translate `args.deepfix` into the object used as `train_one_epoch`.

    Recognized specs, checked in this order:
        "off"                      -> plain TL.train_one_epoch
        "reinit:N:P:R"             -> dfs.DeepFix_TrainOneEpoch(N, P, R, ...)
        "dhist:path"               -> dfs.DeepFix_DHist(path)
        "dfhist:path"              -> dfs.DeepFix_DHist(path, fixed=True)
        "fixed"                    -> dfs.DeepFix_DHist('', fixed=True, init_with_hist=False)
        "beta:A:B"                 -> init_from_beta(model, A, B) via DeepFix_LambdaInit
        "ghaarconv2d:l1,l2,..."    -> convert conv layers (except the listed
                                      ones) and reset the optimizer from args.opt
    Raises:
        NotImplementedError: for any other spec.
    """
    deepfix_spec = args.deepfix

    if deepfix_spec == 'off':
        return TL.train_one_epoch

    if deepfix_spec.startswith('reinit:'):
        _, n_field, p_field, r_field = deepfix_spec.split(':')
        return dfs.DeepFix_TrainOneEpoch(
            int(n_field), float(p_field), int(r_field), TL.train_one_epoch)

    if deepfix_spec.startswith('dhist:'):
        fp = deepfix_spec.split(':', 1)[1]
        assert exists(fp), f'histogram file not found: {fp}'
        return dfs.DeepFix_DHist(fp)

    if deepfix_spec.startswith('dfhist:'):
        fp = deepfix_spec.split(':', 1)[1]
        assert exists(fp), f'histogram file not found: {fp}'
        return dfs.DeepFix_DHist(fp, fixed=True)

    if deepfix_spec == 'fixed':
        return dfs.DeepFix_DHist('', fixed=True, init_with_hist=False)

    if deepfix_spec.startswith('beta:'):
        alpha, beta = deepfix_spec.split(':')[1:]

        def _init_from_beta(cfg):
            # the string -> float conversion happens when the init runs
            return init_from_beta(cfg.model, float(alpha), float(beta))
        return dfs.DeepFix_LambdaInit(_init_from_beta)

    if deepfix_spec.startswith('ghaarconv2d:'):
        ignore_layers = deepfix_spec.split(':')[1].split(',')

        def _convert_to_ghaar(cfg):
            # returns the tuple of step results, in execution order
            return (
                print(f'initialize {deepfix_spec}'),
                convert_conv2d_to_gHaarConv2d(cfg.model, ignore_layers=ignore_layers),
                reset_optimizer(args.opt, cfg.model),
                print(cfg.model)
            )
        return dfs.DeepFix_LambdaInit(_convert_to_ghaar)

    raise NotImplementedError(deepfix_spec)


def train_config(args:'TrainOptions') -> TL.TrainConfig:
    """Assemble a TL.TrainConfig from the parsed training options.

    The model/optimizer/loss, then the datasets/loaders/result factory, then
    the per-epoch training strategy are built (in that order) and passed to
    TL.TrainConfig together with the scalar options.
    """
    model_opt_loss = get_model_opt_loss(
        args.model, args.opt, args.lossfn, args.loss_reg, args.device)
    data_and_results = get_dset_loaders_resultfactory(args.dset)
    epoch_strategy = get_deepfix_train_strategy(args)
    return TL.TrainConfig(
        **model_opt_loss,
        **data_and_results,
        device=args.device,
        epochs=args.epochs,
        start_epoch=args.start_epoch,
        train_one_epoch=epoch_strategy,
        experiment_id=args.experiment_id,
    )


# NOTE(review): this dataclass is registered with simple_parsing's
# ArgumentParser in main(); the class docstring and field comments below are
# presumably surfaced as --help text, so they are left untouched -- TODO confirm.
# NOTE(review): the docstring names only IntelMobileODTCervical, but the DSETS
# registry in this file also offers CheXpert datasets.
@dc.dataclass
class TrainOptions:
    """High-level configuration for training PyTorch models
    on the IntelMobileODTCervical dataset.
    """
    epochs:int = 50
    start_epoch:int = 0  # if "--start_epoch 1", then don't evaluate perf before training.
    device:str = 'cuda' if T.cuda.is_available() else 'cpu'
    dset:str = None #choice(
        #  'intel_mobileodt:train:val:test:v1',
        #  'intel_mobileodt:train+additional:val:test:v1',
        #  'intel_mobileodt:train+additional:noval:test:v1',
        #  'chexpert:.8:.2', 'chexpert:.01:.01', 'chexpert:.001:.001',
        #  'chexpert_small:.8:.2', 'chexpert_small:.01:.01',
        #   'chexpert_small:.001:.001',
        #  default='intel_mobileodt:train:val:test:v1')
    opt:str = 'SGD:lr=.001:momentum=.9:nesterov=1'
    lossfn:str = None  # choices:
        #  'BCEWithLogitsLoss',
        #  'CrossEntropyLoss', 
        #  'CE_intelmobileodt',
        #  'chexpert_uignore', 
        #  'chexpert_identity:N' for some N=num_identities predicted by model (compared to identities y%N)
    loss_reg:str = 'none'  # Optionally add a regularizer to the loss.  loss + reg.  Accepted values:  'none', 'deepfixmlp:X' where X is a positive float denoting the lambda in l1 regularizer
    model:str = 'resnet18:imagenet:3:3'  # Model specification adheres to the template "model_name:pretraining:in_ch:out_ch"
    deepfix:str = 'off'  # DeepFix Re-initialization Method.
                         #  "off" or "reinit:N:P:R" or "d[f]hist:path_to_histogram.pth"
                         #  or "beta:A:B" for A,B as (float) parameters of the beta distribution
                         # 'ghaarconv2d:layer1,layer2' Replaces all spatial convolutions with GHaarConv2d layer except the specified layers
    experiment_id:str = os.environ.get('run_id', 'debugging')
    prune:str = 'off'

    def execute(self):
        """Build the TL.TrainConfig for these options via `train_config`
        and call its `train` method with the config itself as argument."""
        cfg = train_config(self)
        cfg.train(cfg)


def main():
    """Train one hard-coded experiment (EfficientNet-b0 on chexpert_small).

    The options are NOT read from the command line: a fixed argument list is
    handed to the simple_parsing parser, which makes the function usable from
    a notebook cell.  Edit `in_ch`, `out_ch`, `model_params` or the argument
    list below to run something else.

    Raises:
        NotImplementedError: if the `prune` option is anything but 'off'.
    """
    p = ArgumentParser()
    p.add_arguments(TrainOptions, dest='TrainOptions')

    in_ch, out_ch = 1, 14
    model_params = "efficientnet-b0:imagenet:"+str(in_ch)+":"+str(out_ch)
    # Alternative used for a sweep over patch_size in [1,32] and
    # wavelet_level in 1..9 (each run wrapped in try/except printing the error):
    #     model_params = "waveletmlp:300:1:14:"+str(patch_size)+":"+str(wavelet_level)+":1:2"
    exp_id = 'model_'+model_params+'_in_ch_'+str(in_ch)+'out_ch_'+str(out_ch)#+'_patch_size_' + str(patch_size) + '_level_' + str(wavelet_level)
    args = p.parse_args(["--dset", "chexpert_small:.01:.01", "--opt", "Adam:lr=0.001", "--lossfn", "chexpert_uignore", "--model", model_params, "--loss_reg", "none","--experiment_id",exp_id]).TrainOptions
    # Equivalent command line of the script version:
    # python deepfix/train.py --dset chexpert_small:.01:.01 --opt Adam:lr=0.001 --lossfn chexpert_uignore --model waveletmlp:300:1:14:7:1:1:2 --loss_reg none

    print(args)

    # Reject the unsupported pruning option BEFORE building the model and the
    # datasets, so a bad option fails fast.
    if args.prune != 'off':
        assert args.prune.startswith('ChannelPrune:')
        raise NotImplementedError('code is a bit hardcoded, so it is not available without hacking on it.')
        # The statements that used to follow the raise were unreachable; they
        # are kept here as a sketch of the intended pruning step:
        #  print(args.prune)
        #  from explainfix import channelprune
        #  from deepfix.weight_saliency import costfn_multiclass
        #  a = sum([x.numel() for x in cfg.model.parameters()])
        #  channelprune(cfg.model, pct=5, grad_cost_fn=costfn_multiclass,
        #               loader=cfg.train_loader, device=cfg.device, num_minibatches=10)
        #  b = sum([x.numel() for x in cfg.model.parameters()])
        #  assert a/b != 1
        #  print(f'done channelpruning.  {a/b}')

    cfg = train_config(args)
    cfg.train(cfg)

    print('+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++')
    #  import IPython ; IPython.embed() ; import sys ; sys.exit()

    #  with T.profiler.profile(
    #      activities=[
    #          T.profiler.ProfilerActivity.CPU,
    #          T.profiler.ProfilerActivity.CUDA,
    #      ], with_modules=True,
    #  ) as p:
    #      cfg.train(cfg)
    #  print(p.key_averages().table(
    #      sort_by="self_cuda_time_total", row_limit=-1))


# Run the hard-coded experiment defined in main() when this code is executed
# as the main module rather than imported.
if __name__ == "__main__":
    main()


TrainOptions(epochs=50, start_epoch=0, device='cuda', dset='chexpert_small:.01:.01', opt='Adam:lr=0.001', lossfn='chexpert_uignore', loss_reg='none', model='efficientnet-b0:imagenet:1:14', deepfix='off', experiment_id='model_efficientnet-b0:imagenet:1:14_in_ch_1out_ch_14', prune='off')
Loaded pretrained weights for efficientnet-b0
Checkpoint ./results/model_efficientnet-b0:imagenet:1:14_in_ch_1out_ch_14/checkpoints/epoch_0.pth


100%|██████████| 149/149 [00:42<00:00,  3.47it/s]
100%|██████████| 149/149 [00:49<00:00,  2.99it/s]
100%|██████████| 16/16 [00:06<00:00,  2.66it/s]
INFO:simplepytorch.logging_tools:DataLogger writing to file: /ocean/projects/cie160013p/elvinj/DeepFix/deepfix/results/model_efficientnet-b0:imagenet:1:14_in_ch_1out_ch_14/log/20220130T044641.929087_perf.csv


[1m[32mepoch[0m:    0, [1m[32mseconds_training_epoch[0m: nan
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  102.53449, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  nan, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m: -0.04262, [1m[36mtrain_MCC Lung Opacity[0m:  0.06814, [1m[36mtrain_MCC Lung Lesion[0m:  0.06527, [1m[36mtrain_MCC Edema[0m:  0.12473, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m: -0.00124, [1m[36mtrain_MCC Pneumothorax[0m:  nan, [1m[36mtrain_MCC Pleural Effusion[0m:  0.03694, [1m[36mtrain_MCC Pleural Other[0m:  0.00385, [1m[36mtrain_MCC Fracture[0m:  0.01856, [1m[36mtrain_MCC Support Devices[0m: -0.00958, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.00000, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Ca

100%|██████████| 149/149 [01:08<00:00,  2.18it/s]
100%|██████████| 149/149 [00:38<00:00,  3.90it/s]
100%|██████████| 16/16 [00:04<00:00,  3.75it/s]


[1m[32mepoch[0m:    1, [1m[32mseconds_training_epoch[0m: 68.3697
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  54.04770, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.13166, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m: -0.01673, [1m[36mtrain_MCC Cardiomegaly[0m: -0.01201, [1m[36mtrain_MCC Lung Opacity[0m:  0.13806, [1m[36mtrain_MCC Lung Lesion[0m: -0.01581, [1m[36mtrain_MCC Edema[0m:  0.19804, [1m[36mtrain_MCC Consolidation[0m:  0.01040, [1m[36mtrain_MCC Pneumonia[0m: -0.00882, [1m[36mtrain_MCC Atelectasis[0m: -0.02816, [1m[36mtrain_MCC Pneumothorax[0m: -0.01257, [1m[36mtrain_MCC Pleural Effusion[0m:  0.22537, [1m[36mtrain_MCC Pleural Other[0m: -0.00686, [1m[36mtrain_MCC Fracture[0m: -0.01068, [1m[36mtrain_MCC Support Devices[0m:  0.31275, [1m[36mtrain_MCC AVG[0m:  0.06462, [1m[36mtrain_Precision No Finding[0m:  0.41026, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, 

100%|██████████| 149/149 [00:57<00:00,  2.60it/s]
100%|██████████| 149/149 [00:39<00:00,  3.78it/s]
100%|██████████| 16/16 [00:04<00:00,  3.63it/s]


[1m[32mepoch[0m:    2, [1m[32mseconds_training_epoch[0m: 57.2126
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  49.93827, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.16333, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.03369, [1m[36mtrain_MCC Lung Opacity[0m:  0.22753, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.27458, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  nan, [1m[36mtrain_MCC Pneumothorax[0m: -0.00628, [1m[36mtrain_MCC Pleural Effusion[0m:  0.38559, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.39374, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.46512, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Cardiom

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:40<00:00,  3.66it/s]
100%|██████████| 16/16 [00:04<00:00,  3.70it/s]


[1m[32mepoch[0m:    3, [1m[32mseconds_training_epoch[0m: 55.6678
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  47.75075, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.23003, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.07110, [1m[36mtrain_MCC Lung Opacity[0m:  0.23719, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.35526, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.01290, [1m[36mtrain_MCC Pneumothorax[0m:  0.07232, [1m[36mtrain_MCC Pleural Effusion[0m:  0.47888, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.43591, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.54386, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Car

100%|██████████| 149/149 [00:54<00:00,  2.75it/s]
100%|██████████| 149/149 [00:41<00:00,  3.56it/s]
100%|██████████| 16/16 [00:04<00:00,  3.71it/s]


[1m[32mepoch[0m:    4, [1m[32mseconds_training_epoch[0m: 54.2008
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  45.73418, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.29865, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.21505, [1m[36mtrain_MCC Lung Opacity[0m:  0.29810, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.41071, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.04840, [1m[36mtrain_MCC Pneumothorax[0m:  0.13742, [1m[36mtrain_MCC Pleural Effusion[0m:  0.48408, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.48986, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.58025, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Car

100%|██████████| 149/149 [00:51<00:00,  2.87it/s]
100%|██████████| 149/149 [00:43<00:00,  3.41it/s]
100%|██████████| 16/16 [00:04<00:00,  3.63it/s]


[1m[32mepoch[0m:    5, [1m[32mseconds_training_epoch[0m: 51.978
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  43.46494, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.28604, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.31903, [1m[36mtrain_MCC Lung Opacity[0m:  0.29262, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.45340, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.11763, [1m[36mtrain_MCC Pneumothorax[0m:  0.11282, [1m[36mtrain_MCC Pleural Effusion[0m:  0.58710, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.54205, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.51515, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Card

100%|██████████| 149/149 [00:51<00:00,  2.92it/s]
100%|██████████| 149/149 [00:43<00:00,  3.41it/s]
100%|██████████| 16/16 [00:05<00:00,  2.98it/s]


[1m[32mepoch[0m:    6, [1m[32mseconds_training_epoch[0m: 51.0235
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  40.77970, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.45721, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.44708, [1m[36mtrain_MCC Lung Opacity[0m:  0.33508, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.49593, [1m[36mtrain_MCC Consolidation[0m:  0.03529, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.15164, [1m[36mtrain_MCC Pneumothorax[0m:  0.26141, [1m[36mtrain_MCC Pleural Effusion[0m:  0.60199, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.57914, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.65693, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision

100%|██████████| 149/149 [00:49<00:00,  3.02it/s]
100%|██████████| 149/149 [00:41<00:00,  3.56it/s]
100%|██████████| 16/16 [00:04<00:00,  3.24it/s]


[1m[32mepoch[0m:    7, [1m[32mseconds_training_epoch[0m: 49.2739
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  37.57477, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.54313, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.06601, [1m[36mtrain_MCC Cardiomegaly[0m:  0.51097, [1m[36mtrain_MCC Lung Opacity[0m:  0.37657, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.56064, [1m[36mtrain_MCC Consolidation[0m:  0.20221, [1m[36mtrain_MCC Pneumonia[0m: -0.00360, [1m[36mtrain_MCC Atelectasis[0m:  0.25093, [1m[36mtrain_MCC Pneumothorax[0m:  0.38916, [1m[36mtrain_MCC Pleural Effusion[0m:  0.65673, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.63239, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.72078, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.50000, [1m[36mtrain_P

100%|██████████| 149/149 [00:48<00:00,  3.09it/s]
100%|██████████| 149/149 [00:39<00:00,  3.73it/s]
100%|██████████| 16/16 [00:04<00:00,  3.31it/s]


[1m[32mepoch[0m:    8, [1m[32mseconds_training_epoch[0m: 48.2718
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  34.94799, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.56702, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.58117, [1m[36mtrain_MCC Lung Opacity[0m:  0.46895, [1m[36mtrain_MCC Lung Lesion[0m:  0.09879, [1m[36mtrain_MCC Edema[0m:  0.61046, [1m[36mtrain_MCC Consolidation[0m:  0.19005, [1m[36mtrain_MCC Pneumonia[0m:  0.25393, [1m[36mtrain_MCC Atelectasis[0m:  0.28480, [1m[36mtrain_MCC Pneumothorax[0m:  0.45903, [1m[36mtrain_MCC Pleural Effusion[0m:  0.69879, [1m[36mtrain_MCC Pleural Other[0m: -0.00259, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.66089, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.70690, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtra

100%|██████████| 149/149 [00:49<00:00,  3.02it/s]
100%|██████████| 149/149 [00:38<00:00,  3.85it/s]
100%|██████████| 16/16 [00:04<00:00,  3.33it/s]


[1m[32mepoch[0m:    9, [1m[32mseconds_training_epoch[0m: 49.3434
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  30.51061, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.68955, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.13883, [1m[36mtrain_MCC Cardiomegaly[0m:  0.67114, [1m[36mtrain_MCC Lung Opacity[0m:  0.54198, [1m[36mtrain_MCC Lung Lesion[0m:  0.15886, [1m[36mtrain_MCC Edema[0m:  0.69060, [1m[36mtrain_MCC Consolidation[0m:  0.32994, [1m[36mtrain_MCC Pneumonia[0m:  0.38421, [1m[36mtrain_MCC Atelectasis[0m:  0.38208, [1m[36mtrain_MCC Pneumothorax[0m:  0.62650, [1m[36mtrain_MCC Pleural Effusion[0m:  0.74123, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  0.15737, [1m[36mtrain_MCC Support Devices[0m:  0.71846, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.79082, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  1.00000, [1m[36

100%|██████████| 149/149 [00:50<00:00,  2.94it/s]
100%|██████████| 149/149 [00:36<00:00,  4.05it/s]
100%|██████████| 16/16 [00:04<00:00,  3.30it/s]


[1m[32mepoch[0m:   10, [1m[32mseconds_training_epoch[0m: 50.7661
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  27.34904, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.73494, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.20182, [1m[36mtrain_MCC Cardiomegaly[0m:  0.70056, [1m[36mtrain_MCC Lung Opacity[0m:  0.58715, [1m[36mtrain_MCC Lung Lesion[0m:  0.30817, [1m[36mtrain_MCC Edema[0m:  0.74133, [1m[36mtrain_MCC Consolidation[0m:  0.40425, [1m[36mtrain_MCC Pneumonia[0m:  0.46541, [1m[36mtrain_MCC Atelectasis[0m:  0.50774, [1m[36mtrain_MCC Pneumothorax[0m:  0.62650, [1m[36mtrain_MCC Pleural Effusion[0m:  0.76873, [1m[36mtrain_MCC Pleural Other[0m:  0.17553, [1m[36mtrain_MCC Fracture[0m:  0.29587, [1m[36mtrain_MCC Support Devices[0m:  0.76160, [1m[36mtrain_MCC AVG[0m:  0.51997, [1m[36mtrain_Precision No Finding[0m:  0.82587, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.63636, 

100%|██████████| 149/149 [00:52<00:00,  2.84it/s]
100%|██████████| 149/149 [00:35<00:00,  4.25it/s]
100%|██████████| 16/16 [00:04<00:00,  3.28it/s]


[1m[32mepoch[0m:   11, [1m[32mseconds_training_epoch[0m: 52.3936
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  22.66054, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.78033, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.33476, [1m[36mtrain_MCC Cardiomegaly[0m:  0.81903, [1m[36mtrain_MCC Lung Opacity[0m:  0.67414, [1m[36mtrain_MCC Lung Lesion[0m:  0.23483, [1m[36mtrain_MCC Edema[0m:  0.78931, [1m[36mtrain_MCC Consolidation[0m:  0.54211, [1m[36mtrain_MCC Pneumonia[0m:  0.56632, [1m[36mtrain_MCC Atelectasis[0m:  0.60507, [1m[36mtrain_MCC Pneumothorax[0m:  0.73069, [1m[36mtrain_MCC Pleural Effusion[0m:  0.82807, [1m[36mtrain_MCC Pleural Other[0m:  0.17306, [1m[36mtrain_MCC Fracture[0m:  0.40725, [1m[36mtrain_MCC Support Devices[0m:  0.82006, [1m[36mtrain_MCC AVG[0m:  0.59321, [1m[36mtrain_Precision No Finding[0m:  0.83871, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.78947, 

100%|██████████| 149/149 [00:53<00:00,  2.76it/s]
100%|██████████| 149/149 [00:33<00:00,  4.41it/s]
100%|██████████| 16/16 [00:04<00:00,  3.28it/s]


[1m[32mepoch[0m:   12, [1m[32mseconds_training_epoch[0m: 53.9687
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  20.27620, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.81901, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.45223, [1m[36mtrain_MCC Cardiomegaly[0m:  0.77120, [1m[36mtrain_MCC Lung Opacity[0m:  0.69980, [1m[36mtrain_MCC Lung Lesion[0m:  0.50757, [1m[36mtrain_MCC Edema[0m:  0.77841, [1m[36mtrain_MCC Consolidation[0m:  0.71594, [1m[36mtrain_MCC Pneumonia[0m:  0.52709, [1m[36mtrain_MCC Atelectasis[0m:  0.69333, [1m[36mtrain_MCC Pneumothorax[0m:  0.79167, [1m[36mtrain_MCC Pleural Effusion[0m:  0.82391, [1m[36mtrain_MCC Pleural Other[0m:  0.46504, [1m[36mtrain_MCC Fracture[0m:  0.49011, [1m[36mtrain_MCC Support Devices[0m:  0.82190, [1m[36mtrain_MCC AVG[0m:  0.66837, [1m[36mtrain_Precision No Finding[0m:  0.86161, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.79412, 

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:32<00:00,  4.61it/s]
100%|██████████| 16/16 [00:04<00:00,  3.29it/s]


[1m[32mepoch[0m:   13, [1m[32mseconds_training_epoch[0m: 55.5086
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  17.05002, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.84734, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.58246, [1m[36mtrain_MCC Cardiomegaly[0m:  0.85317, [1m[36mtrain_MCC Lung Opacity[0m:  0.76775, [1m[36mtrain_MCC Lung Lesion[0m:  0.50321, [1m[36mtrain_MCC Edema[0m:  0.82761, [1m[36mtrain_MCC Consolidation[0m:  0.72169, [1m[36mtrain_MCC Pneumonia[0m:  0.70686, [1m[36mtrain_MCC Atelectasis[0m:  0.76524, [1m[36mtrain_MCC Pneumothorax[0m:  0.78514, [1m[36mtrain_MCC Pleural Effusion[0m:  0.84026, [1m[36mtrain_MCC Pleural Other[0m:  0.50648, [1m[36mtrain_MCC Fracture[0m:  0.75401, [1m[36mtrain_MCC Support Devices[0m:  0.86055, [1m[36mtrain_MCC AVG[0m:  0.73727, [1m[36mtrain_Precision No Finding[0m:  0.87446, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.85417, 

100%|██████████| 149/149 [00:57<00:00,  2.60it/s]
100%|██████████| 149/149 [00:32<00:00,  4.64it/s]
100%|██████████| 16/16 [00:04<00:00,  3.90it/s]


[1m[32mepoch[0m:   14, [1m[32mseconds_training_epoch[0m: 57.2883
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  14.83794, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.84321, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.64254, [1m[36mtrain_MCC Cardiomegaly[0m:  0.85552, [1m[36mtrain_MCC Lung Opacity[0m:  0.79810, [1m[36mtrain_MCC Lung Lesion[0m:  0.70890, [1m[36mtrain_MCC Edema[0m:  0.85633, [1m[36mtrain_MCC Consolidation[0m:  0.79267, [1m[36mtrain_MCC Pneumonia[0m:  0.72965, [1m[36mtrain_MCC Atelectasis[0m:  0.74215, [1m[36mtrain_MCC Pneumothorax[0m:  0.85403, [1m[36mtrain_MCC Pleural Effusion[0m:  0.87340, [1m[36mtrain_MCC Pleural Other[0m:  0.68619, [1m[36mtrain_MCC Fracture[0m:  0.74806, [1m[36mtrain_MCC Support Devices[0m:  0.88940, [1m[36mtrain_MCC AVG[0m:  0.78715, [1m[36mtrain_Precision No Finding[0m:  0.88393, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.80303, 

100%|██████████| 149/149 [00:57<00:00,  2.58it/s]
100%|██████████| 149/149 [00:32<00:00,  4.52it/s]
100%|██████████| 16/16 [00:03<00:00,  4.15it/s]


[1m[32mepoch[0m:   15, [1m[32mseconds_training_epoch[0m: 57.709
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  12.49240, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.86779, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.80827, [1m[36mtrain_MCC Cardiomegaly[0m:  0.89490, [1m[36mtrain_MCC Lung Opacity[0m:  0.82925, [1m[36mtrain_MCC Lung Lesion[0m:  0.74677, [1m[36mtrain_MCC Edema[0m:  0.87717, [1m[36mtrain_MCC Consolidation[0m:  0.87913, [1m[36mtrain_MCC Pneumonia[0m:  0.77704, [1m[36mtrain_MCC Atelectasis[0m:  0.78802, [1m[36mtrain_MCC Pneumothorax[0m:  0.86974, [1m[36mtrain_MCC Pleural Effusion[0m:  0.87892, [1m[36mtrain_MCC Pleural Other[0m:  0.72722, [1m[36mtrain_MCC Fracture[0m:  0.79799, [1m[36mtrain_MCC Support Devices[0m:  0.89563, [1m[36mtrain_MCC AVG[0m:  0.83128, [1m[36mtrain_Precision No Finding[0m:  0.90265, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.89157, 

100%|██████████| 149/149 [00:56<00:00,  2.64it/s]
100%|██████████| 149/149 [00:34<00:00,  4.36it/s]
100%|██████████| 16/16 [00:03<00:00,  4.10it/s]


[1m[32mepoch[0m:   16, [1m[32mseconds_training_epoch[0m: 56.3409
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  11.83996, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.87779, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.75096, [1m[36mtrain_MCC Cardiomegaly[0m:  0.90371, [1m[36mtrain_MCC Lung Opacity[0m:  0.83109, [1m[36mtrain_MCC Lung Lesion[0m:  0.78489, [1m[36mtrain_MCC Edema[0m:  0.88214, [1m[36mtrain_MCC Consolidation[0m:  0.84882, [1m[36mtrain_MCC Pneumonia[0m:  0.78185, [1m[36mtrain_MCC Atelectasis[0m:  0.85094, [1m[36mtrain_MCC Pneumothorax[0m:  0.84300, [1m[36mtrain_MCC Pleural Effusion[0m:  0.91694, [1m[36mtrain_MCC Pleural Other[0m:  0.62208, [1m[36mtrain_MCC Fracture[0m:  0.81007, [1m[36mtrain_MCC Support Devices[0m:  0.87404, [1m[36mtrain_MCC AVG[0m:  0.82702, [1m[36mtrain_Precision No Finding[0m:  0.90789, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.86842, 

100%|██████████| 149/149 [00:55<00:00,  2.70it/s]
100%|██████████| 149/149 [00:36<00:00,  4.13it/s]
100%|██████████| 16/16 [00:03<00:00,  4.07it/s]


[1m[32mepoch[0m:   17, [1m[32mseconds_training_epoch[0m: 55.2228
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  10.46720, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93557, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.86042, [1m[36mtrain_MCC Cardiomegaly[0m:  0.89822, [1m[36mtrain_MCC Lung Opacity[0m:  0.87426, [1m[36mtrain_MCC Lung Lesion[0m:  0.81101, [1m[36mtrain_MCC Edema[0m:  0.89904, [1m[36mtrain_MCC Consolidation[0m:  0.87623, [1m[36mtrain_MCC Pneumonia[0m:  0.88379, [1m[36mtrain_MCC Atelectasis[0m:  0.83776, [1m[36mtrain_MCC Pneumothorax[0m:  0.86335, [1m[36mtrain_MCC Pleural Effusion[0m:  0.92559, [1m[36mtrain_MCC Pleural Other[0m:  0.84604, [1m[36mtrain_MCC Fracture[0m:  0.86277, [1m[36mtrain_MCC Support Devices[0m:  0.88937, [1m[36mtrain_MCC AVG[0m:  0.87596, [1m[36mtrain_Precision No Finding[0m:  0.95652, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94048, 

100%|██████████| 149/149 [00:53<00:00,  2.79it/s]
100%|██████████| 149/149 [00:37<00:00,  4.02it/s]
100%|██████████| 16/16 [00:03<00:00,  4.01it/s]


[1m[32mepoch[0m:   18, [1m[32mseconds_training_epoch[0m: 53.3466
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  9.68130, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.91947, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.84450, [1m[36mtrain_MCC Cardiomegaly[0m:  0.90556, [1m[36mtrain_MCC Lung Opacity[0m:  0.83842, [1m[36mtrain_MCC Lung Lesion[0m:  0.78734, [1m[36mtrain_MCC Edema[0m:  0.91217, [1m[36mtrain_MCC Consolidation[0m:  0.86386, [1m[36mtrain_MCC Pneumonia[0m:  0.77927, [1m[36mtrain_MCC Atelectasis[0m:  0.89735, [1m[36mtrain_MCC Pneumothorax[0m:  0.90456, [1m[36mtrain_MCC Pleural Effusion[0m:  0.91869, [1m[36mtrain_MCC Pleural Other[0m:  0.95131, [1m[36mtrain_MCC Fracture[0m:  0.83758, [1m[36mtrain_MCC Support Devices[0m:  0.91455, [1m[36mtrain_MCC AVG[0m:  0.87676, [1m[36mtrain_Precision No Finding[0m:  0.93191, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.90805, 

100%|██████████| 149/149 [00:52<00:00,  2.86it/s]
100%|██████████| 149/149 [00:38<00:00,  3.88it/s]
100%|██████████| 16/16 [00:03<00:00,  4.12it/s]


[1m[32mepoch[0m:   19, [1m[32mseconds_training_epoch[0m: 52.1547
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  8.68400, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.91192, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.84741, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93149, [1m[36mtrain_MCC Lung Opacity[0m:  0.85775, [1m[36mtrain_MCC Lung Lesion[0m:  0.88870, [1m[36mtrain_MCC Edema[0m:  0.92940, [1m[36mtrain_MCC Consolidation[0m:  0.89510, [1m[36mtrain_MCC Pneumonia[0m:  0.86917, [1m[36mtrain_MCC Atelectasis[0m:  0.90125, [1m[36mtrain_MCC Pneumothorax[0m:  0.88339, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93420, [1m[36mtrain_MCC Pleural Other[0m:  0.90014, [1m[36mtrain_MCC Fracture[0m:  0.91758, [1m[36mtrain_MCC Support Devices[0m:  0.91814, [1m[36mtrain_MCC AVG[0m:  0.89897, [1m[36mtrain_Precision No Finding[0m:  0.93103, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96154, 

100%|██████████| 149/149 [00:50<00:00,  2.96it/s]
100%|██████████| 149/149 [00:39<00:00,  3.74it/s]
100%|██████████| 16/16 [00:03<00:00,  4.25it/s]


[1m[32mepoch[0m:   20, [1m[32mseconds_training_epoch[0m: 50.3984
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  7.59288, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95236, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.92977, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93121, [1m[36mtrain_MCC Lung Opacity[0m:  0.90453, [1m[36mtrain_MCC Lung Lesion[0m:  0.90006, [1m[36mtrain_MCC Edema[0m:  0.92565, [1m[36mtrain_MCC Consolidation[0m:  0.86584, [1m[36mtrain_MCC Pneumonia[0m:  0.87868, [1m[36mtrain_MCC Atelectasis[0m:  0.91842, [1m[36mtrain_MCC Pneumothorax[0m:  0.93724, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94294, [1m[36mtrain_MCC Pleural Other[0m:  0.86682, [1m[36mtrain_MCC Fracture[0m:  0.91758, [1m[36mtrain_MCC Support Devices[0m:  0.90553, [1m[36mtrain_MCC AVG[0m:  0.91262, [1m[36mtrain_Precision No Finding[0m:  0.96970, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95745, 

100%|██████████| 149/149 [00:48<00:00,  3.05it/s]
100%|██████████| 149/149 [00:40<00:00,  3.66it/s]
100%|██████████| 16/16 [00:04<00:00,  3.51it/s]


[1m[32mepoch[0m:   21, [1m[32mseconds_training_epoch[0m: 48.8464
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  7.61992, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94298, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.84450, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93596, [1m[36mtrain_MCC Lung Opacity[0m:  0.90275, [1m[36mtrain_MCC Lung Lesion[0m:  0.86597, [1m[36mtrain_MCC Edema[0m:  0.93810, [1m[36mtrain_MCC Consolidation[0m:  0.91137, [1m[36mtrain_MCC Pneumonia[0m:  0.91975, [1m[36mtrain_MCC Atelectasis[0m:  0.89299, [1m[36mtrain_MCC Pneumothorax[0m:  0.92392, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93518, [1m[36mtrain_MCC Pleural Other[0m:  0.79908, [1m[36mtrain_MCC Fracture[0m:  0.93862, [1m[36mtrain_MCC Support Devices[0m:  0.91273, [1m[36mtrain_MCC AVG[0m:  0.90456, [1m[36mtrain_Precision No Finding[0m:  0.95708, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.90805, 

100%|██████████| 149/149 [00:47<00:00,  3.13it/s]
100%|██████████| 149/149 [00:40<00:00,  3.67it/s]
100%|██████████| 16/16 [00:04<00:00,  3.35it/s]


[1m[32mepoch[0m:   22, [1m[32mseconds_training_epoch[0m: 47.6813
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  7.45060, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.90017, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.91378, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95462, [1m[36mtrain_MCC Lung Opacity[0m:  0.90086, [1m[36mtrain_MCC Lung Lesion[0m:  0.93454, [1m[36mtrain_MCC Edema[0m:  0.91728, [1m[36mtrain_MCC Consolidation[0m:  0.94437, [1m[36mtrain_MCC Pneumonia[0m:  0.90316, [1m[36mtrain_MCC Atelectasis[0m:  0.90710, [1m[36mtrain_MCC Pneumothorax[0m:  0.91862, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95066, [1m[36mtrain_MCC Pleural Other[0m:  0.91750, [1m[36mtrain_MCC Fracture[0m:  0.93886, [1m[36mtrain_MCC Support Devices[0m:  0.90744, [1m[36mtrain_MCC AVG[0m:  0.92207, [1m[36mtrain_Precision No Finding[0m:  0.91845, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.93684, 

100%|██████████| 149/149 [00:46<00:00,  3.19it/s]
100%|██████████| 149/149 [00:40<00:00,  3.68it/s]
100%|██████████| 16/16 [00:04<00:00,  3.29it/s]


[1m[32mepoch[0m:   23, [1m[32mseconds_training_epoch[0m: 46.6419
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  7.56086, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.91563, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.89137, [1m[36mtrain_MCC Cardiomegaly[0m:  0.91466, [1m[36mtrain_MCC Lung Opacity[0m:  0.89732, [1m[36mtrain_MCC Lung Lesion[0m:  0.92923, [1m[36mtrain_MCC Edema[0m:  0.93210, [1m[36mtrain_MCC Consolidation[0m:  0.92649, [1m[36mtrain_MCC Pneumonia[0m:  0.82623, [1m[36mtrain_MCC Atelectasis[0m:  0.91454, [1m[36mtrain_MCC Pneumothorax[0m:  0.92111, [1m[36mtrain_MCC Pleural Effusion[0m:  0.92559, [1m[36mtrain_MCC Pleural Other[0m:  0.91750, [1m[36mtrain_MCC Fracture[0m:  0.90420, [1m[36mtrain_MCC Support Devices[0m:  0.93343, [1m[36mtrain_MCC AVG[0m:  0.91067, [1m[36mtrain_Precision No Finding[0m:  0.95495, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.92473, 

100%|██████████| 149/149 [00:48<00:00,  3.07it/s]
100%|██████████| 149/149 [00:39<00:00,  3.80it/s]
100%|██████████| 16/16 [00:04<00:00,  3.34it/s]


[1m[32mepoch[0m:   24, [1m[32mseconds_training_epoch[0m: 48.4964
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  6.86014, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94051, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.91807, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94610, [1m[36mtrain_MCC Lung Opacity[0m:  0.94033, [1m[36mtrain_MCC Lung Lesion[0m:  0.95668, [1m[36mtrain_MCC Edema[0m:  0.94067, [1m[36mtrain_MCC Consolidation[0m:  0.90211, [1m[36mtrain_MCC Pneumonia[0m:  0.94044, [1m[36mtrain_MCC Atelectasis[0m:  0.91619, [1m[36mtrain_MCC Pneumothorax[0m:  0.88802, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93519, [1m[36mtrain_MCC Pleural Other[0m:  0.93506, [1m[36mtrain_MCC Fracture[0m:  0.95258, [1m[36mtrain_MCC Support Devices[0m:  0.92532, [1m[36mtrain_MCC AVG[0m:  0.93123, [1m[36mtrain_Precision No Finding[0m:  0.95690, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96667, 

100%|██████████| 149/149 [00:49<00:00,  3.00it/s]
100%|██████████| 149/149 [00:37<00:00,  3.99it/s]
100%|██████████| 16/16 [00:04<00:00,  3.28it/s]


[1m[32mepoch[0m:   25, [1m[32mseconds_training_epoch[0m: 49.7301
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.91234, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93594, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95174, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95864, [1m[36mtrain_MCC Lung Opacity[0m:  0.90453, [1m[36mtrain_MCC Lung Lesion[0m:  0.88981, [1m[36mtrain_MCC Edema[0m:  0.94198, [1m[36mtrain_MCC Consolidation[0m:  0.94746, [1m[36mtrain_MCC Pneumonia[0m:  0.87093, [1m[36mtrain_MCC Atelectasis[0m:  0.90650, [1m[36mtrain_MCC Pneumothorax[0m:  0.93207, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94871, [1m[36mtrain_MCC Pleural Other[0m:  1.00000, [1m[36mtrain_MCC Fracture[0m:  0.93224, [1m[36mtrain_MCC Support Devices[0m:  0.95412, [1m[36mtrain_MCC AVG[0m:  0.93391, [1m[36mtrain_Precision No Finding[0m:  0.94872, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96875, 

100%|██████████| 149/149 [00:51<00:00,  2.92it/s]
100%|██████████| 149/149 [00:35<00:00,  4.15it/s]
100%|██████████| 16/16 [00:04<00:00,  3.32it/s]


[1m[32mepoch[0m:   26, [1m[32mseconds_training_epoch[0m: 51.0899
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.77387, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94316, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.89216, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93337, [1m[36mtrain_MCC Lung Opacity[0m:  0.93023, [1m[36mtrain_MCC Lung Lesion[0m:  0.97305, [1m[36mtrain_MCC Edema[0m:  0.92709, [1m[36mtrain_MCC Consolidation[0m:  0.95491, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.92456, [1m[36mtrain_MCC Pneumothorax[0m:  0.94010, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95940, [1m[36mtrain_MCC Pleural Other[0m:  0.90068, [1m[36mtrain_MCC Fracture[0m:  0.93862, [1m[36mtrain_MCC Support Devices[0m:  0.93705, [1m[36mtrain_MCC AVG[0m:  0.93611, [1m[36mtrain_Precision No Finding[0m:  0.95319, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.91579, 

100%|██████████| 149/149 [00:52<00:00,  2.83it/s]
100%|██████████| 149/149 [00:34<00:00,  4.30it/s]
100%|██████████| 16/16 [00:04<00:00,  3.33it/s]


[1m[32mepoch[0m:   27, [1m[32mseconds_training_epoch[0m: 52.6156
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.46365, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.97632, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93503, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95262, [1m[36mtrain_MCC Lung Opacity[0m:  0.93207, [1m[36mtrain_MCC Lung Lesion[0m:  0.91829, [1m[36mtrain_MCC Edema[0m:  0.94813, [1m[36mtrain_MCC Consolidation[0m:  0.91579, [1m[36mtrain_MCC Pneumonia[0m:  0.93015, [1m[36mtrain_MCC Atelectasis[0m:  0.93134, [1m[36mtrain_MCC Pneumothorax[0m:  0.93116, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94396, [1m[36mtrain_MCC Pleural Other[0m:  0.96780, [1m[36mtrain_MCC Fracture[0m:  0.93283, [1m[36mtrain_MCC Support Devices[0m:  0.95771, [1m[36mtrain_MCC AVG[0m:  0.94094, [1m[36mtrain_Precision No Finding[0m:  0.98298, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96774, 

100%|██████████| 149/149 [00:54<00:00,  2.74it/s]
100%|██████████| 149/149 [00:33<00:00,  4.48it/s]
100%|██████████| 16/16 [00:04<00:00,  3.25it/s]


[1m[32mepoch[0m:   28, [1m[32mseconds_training_epoch[0m: 54.4634
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  6.17141, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93842, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.84288, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95008, [1m[36mtrain_MCC Lung Opacity[0m:  0.92564, [1m[36mtrain_MCC Lung Lesion[0m:  0.89135, [1m[36mtrain_MCC Edema[0m:  0.94723, [1m[36mtrain_MCC Consolidation[0m:  0.95116, [1m[36mtrain_MCC Pneumonia[0m:  0.94044, [1m[36mtrain_MCC Atelectasis[0m:  0.93901, [1m[36mtrain_MCC Pneumothorax[0m:  0.95296, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94878, [1m[36mtrain_MCC Pleural Other[0m:  0.93455, [1m[36mtrain_MCC Fracture[0m:  0.91143, [1m[36mtrain_MCC Support Devices[0m:  0.94062, [1m[36mtrain_MCC AVG[0m:  0.92961, [1m[36mtrain_Precision No Finding[0m:  0.94894, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.87234, 

100%|██████████| 149/149 [00:56<00:00,  2.66it/s]
100%|██████████| 149/149 [00:31<00:00,  4.71it/s]
100%|██████████| 16/16 [00:05<00:00,  3.17it/s]


[1m[32mepoch[0m:   29, [1m[32mseconds_training_epoch[0m: 56.0039
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.85699, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93557, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94595, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95025, [1m[36mtrain_MCC Lung Opacity[0m:  0.92291, [1m[36mtrain_MCC Lung Lesion[0m:  0.91781, [1m[36mtrain_MCC Edema[0m:  0.94306, [1m[36mtrain_MCC Consolidation[0m:  0.91980, [1m[36mtrain_MCC Pneumonia[0m:  0.92032, [1m[36mtrain_MCC Atelectasis[0m:  0.94796, [1m[36mtrain_MCC Pneumothorax[0m:  0.94655, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95163, [1m[36mtrain_MCC Pleural Other[0m:  0.92204, [1m[36mtrain_MCC Fracture[0m:  0.91734, [1m[36mtrain_MCC Support Devices[0m:  0.93883, [1m[36mtrain_MCC AVG[0m:  0.93429, [1m[36mtrain_Precision No Finding[0m:  0.95652, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97849, 

100%|██████████| 149/149 [00:57<00:00,  2.61it/s]
100%|██████████| 149/149 [00:31<00:00,  4.68it/s]
100%|██████████| 16/16 [00:04<00:00,  3.87it/s]


[1m[32mepoch[0m:   30, [1m[32mseconds_training_epoch[0m: 57.0162
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.57695, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94035, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95210, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96482, [1m[36mtrain_MCC Lung Opacity[0m:  0.92566, [1m[36mtrain_MCC Lung Lesion[0m:  0.94554, [1m[36mtrain_MCC Edema[0m:  0.93844, [1m[36mtrain_MCC Consolidation[0m:  0.95454, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.94431, [1m[36mtrain_MCC Pneumothorax[0m:  0.96564, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94486, [1m[36mtrain_MCC Pleural Other[0m:  0.91803, [1m[36mtrain_MCC Fracture[0m:  0.95323, [1m[36mtrain_MCC Support Devices[0m:  0.94602, [1m[36mtrain_MCC AVG[0m:  0.94605, [1m[36mtrain_Precision No Finding[0m:  0.96087, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95918, 

100%|██████████| 149/149 [00:57<00:00,  2.61it/s]
100%|██████████| 149/149 [00:33<00:00,  4.43it/s]
100%|██████████| 16/16 [00:03<00:00,  4.19it/s]


[1m[32mepoch[0m:   31, [1m[32mseconds_training_epoch[0m: 57.0469
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.58326, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96211, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95149, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95864, [1m[36mtrain_MCC Lung Opacity[0m:  0.93482, [1m[36mtrain_MCC Lung Lesion[0m:  0.93454, [1m[36mtrain_MCC Edema[0m:  0.94818, [1m[36mtrain_MCC Consolidation[0m:  0.94885, [1m[36mtrain_MCC Pneumonia[0m:  0.93015, [1m[36mtrain_MCC Atelectasis[0m:  0.92984, [1m[36mtrain_MCC Pneumothorax[0m:  0.94371, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93038, [1m[36mtrain_MCC Pleural Other[0m:  0.95131, [1m[36mtrain_MCC Fracture[0m:  0.89866, [1m[36mtrain_MCC Support Devices[0m:  0.93882, [1m[36mtrain_MCC AVG[0m:  0.94011, [1m[36mtrain_Precision No Finding[0m:  0.97021, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97872, 

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:34<00:00,  4.27it/s]
100%|██████████| 16/16 [00:03<00:00,  4.12it/s]


[1m[32mepoch[0m:   32, [1m[32mseconds_training_epoch[0m: 55.6208
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.52742, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95737, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94063, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96498, [1m[36mtrain_MCC Lung Opacity[0m:  0.92472, [1m[36mtrain_MCC Lung Lesion[0m:  0.94055, [1m[36mtrain_MCC Edema[0m:  0.96552, [1m[36mtrain_MCC Consolidation[0m:  0.93377, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.95547, [1m[36mtrain_MCC Pneumothorax[0m:  0.97197, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96904, [1m[36mtrain_MCC Pleural Other[0m:  0.91803, [1m[36mtrain_MCC Fracture[0m:  0.97343, [1m[36mtrain_MCC Support Devices[0m:  0.95142, [1m[36mtrain_MCC AVG[0m:  0.95129, [1m[36mtrain_Precision No Finding[0m:  0.96596, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96809, 

100%|██████████| 149/149 [00:54<00:00,  2.75it/s]
100%|██████████| 149/149 [00:36<00:00,  4.10it/s]
100%|██████████| 16/16 [00:03<00:00,  4.18it/s]


[1m[32mepoch[0m:   33, [1m[32mseconds_training_epoch[0m: 54.2024
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.38548, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96467, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94145, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96489, [1m[36mtrain_MCC Lung Opacity[0m:  0.93758, [1m[36mtrain_MCC Lung Lesion[0m:  0.95654, [1m[36mtrain_MCC Edema[0m:  0.96664, [1m[36mtrain_MCC Consolidation[0m:  0.94437, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.95010, [1m[36mtrain_MCC Pneumothorax[0m:  0.94985, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95937, [1m[36mtrain_MCC Pleural Other[0m:  0.93455, [1m[36mtrain_MCC Fracture[0m:  0.97312, [1m[36mtrain_MCC Support Devices[0m:  0.95232, [1m[36mtrain_MCC AVG[0m:  0.95333, [1m[36mtrain_Precision No Finding[0m:  0.96639, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94898, 

100%|██████████| 149/149 [00:52<00:00,  2.84it/s]
100%|██████████| 149/149 [00:37<00:00,  3.95it/s]
100%|██████████| 16/16 [00:03<00:00,  4.17it/s]


[1m[32mepoch[0m:   34, [1m[32mseconds_training_epoch[0m: 52.5579
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.05000, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93888, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96249, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94599, [1m[36mtrain_MCC Lung Opacity[0m:  0.92289, [1m[36mtrain_MCC Lung Lesion[0m:  0.91382, [1m[36mtrain_MCC Edema[0m:  0.96687, [1m[36mtrain_MCC Consolidation[0m:  0.92679, [1m[36mtrain_MCC Pneumonia[0m:  0.91208, [1m[36mtrain_MCC Atelectasis[0m:  0.93901, [1m[36mtrain_MCC Pneumothorax[0m:  0.95959, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96227, [1m[36mtrain_MCC Pleural Other[0m:  0.96829, [1m[36mtrain_MCC Fracture[0m:  0.93283, [1m[36mtrain_MCC Support Devices[0m:  0.94782, [1m[36mtrain_MCC AVG[0m:  0.94283, [1m[36mtrain_Precision No Finding[0m:  0.94142, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97917, 

100%|██████████| 149/149 [00:51<00:00,  2.91it/s]
100%|██████████| 149/149 [00:39<00:00,  3.81it/s]
100%|██████████| 16/16 [00:03<00:00,  4.09it/s]


[1m[32mepoch[0m:   35, [1m[32mseconds_training_epoch[0m: 51.1492
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.73850, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95968, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96235, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96051, [1m[36mtrain_MCC Lung Opacity[0m:  0.93849, [1m[36mtrain_MCC Lung Lesion[0m:  0.91781, [1m[36mtrain_MCC Edema[0m:  0.96421, [1m[36mtrain_MCC Consolidation[0m:  0.95474, [1m[36mtrain_MCC Pneumonia[0m:  0.89085, [1m[36mtrain_MCC Atelectasis[0m:  0.94431, [1m[36mtrain_MCC Pneumothorax[0m:  0.93767, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95067, [1m[36mtrain_MCC Pleural Other[0m:  0.96829, [1m[36mtrain_MCC Fracture[0m:  0.93886, [1m[36mtrain_MCC Support Devices[0m:  0.95053, [1m[36mtrain_MCC AVG[0m:  0.94564, [1m[36mtrain_Precision No Finding[0m:  0.97009, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.98936, 

100%|██████████| 149/149 [00:49<00:00,  3.01it/s]
100%|██████████| 149/149 [00:40<00:00,  3.68it/s]
100%|██████████| 16/16 [00:03<00:00,  4.01it/s]


[1m[32mepoch[0m:   36, [1m[32mseconds_training_epoch[0m: 49.4836
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.42426, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96951, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93642, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94423, [1m[36mtrain_MCC Lung Opacity[0m:  0.92656, [1m[36mtrain_MCC Lung Lesion[0m:  0.96798, [1m[36mtrain_MCC Edema[0m:  0.96296, [1m[36mtrain_MCC Consolidation[0m:  0.94416, [1m[36mtrain_MCC Pneumonia[0m:  0.94099, [1m[36mtrain_MCC Atelectasis[0m:  0.95749, [1m[36mtrain_MCC Pneumothorax[0m:  0.93794, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96809, [1m[36mtrain_MCC Pleural Other[0m:  0.93506, [1m[36mtrain_MCC Fracture[0m:  0.92472, [1m[36mtrain_MCC Support Devices[0m:  0.95235, [1m[36mtrain_MCC AVG[0m:  0.94775, [1m[36mtrain_Precision No Finding[0m:  0.96667, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.93939, 

100%|██████████| 149/149 [00:48<00:00,  3.10it/s]
100%|██████████| 149/149 [00:40<00:00,  3.66it/s]
100%|██████████| 16/16 [00:04<00:00,  3.25it/s]


[1m[32mepoch[0m:   37, [1m[32mseconds_training_epoch[0m: 48.0851
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.83628, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95249, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96796, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93780, [1m[36mtrain_MCC Lung Opacity[0m:  0.94767, [1m[36mtrain_MCC Lung Lesion[0m:  0.93992, [1m[36mtrain_MCC Edema[0m:  0.95186, [1m[36mtrain_MCC Consolidation[0m:  0.95133, [1m[36mtrain_MCC Pneumonia[0m:  0.96126, [1m[36mtrain_MCC Atelectasis[0m:  0.94811, [1m[36mtrain_MCC Pneumothorax[0m:  0.96295, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94681, [1m[36mtrain_MCC Pleural Other[0m:  0.91803, [1m[36mtrain_MCC Fracture[0m:  0.95381, [1m[36mtrain_MCC Support Devices[0m:  0.94602, [1m[36mtrain_MCC AVG[0m:  0.94900, [1m[36mtrain_Precision No Finding[0m:  0.96567, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97938, 

100%|██████████| 149/149 [00:46<00:00,  3.20it/s]
100%|██████████| 149/149 [00:40<00:00,  3.67it/s]
100%|██████████| 16/16 [00:04<00:00,  3.27it/s]


[1m[32mepoch[0m:   38, [1m[32mseconds_training_epoch[0m: 46.5213
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.84583, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.98818, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95701, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96086, [1m[36mtrain_MCC Lung Opacity[0m:  0.96330, [1m[36mtrain_MCC Lung Lesion[0m:  0.93454, [1m[36mtrain_MCC Edema[0m:  0.96665, [1m[36mtrain_MCC Consolidation[0m:  0.96880, [1m[36mtrain_MCC Pneumonia[0m:  0.90982, [1m[36mtrain_MCC Atelectasis[0m:  0.95380, [1m[36mtrain_MCC Pneumothorax[0m:  0.96571, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96326, [1m[36mtrain_MCC Pleural Other[0m:  0.91803, [1m[36mtrain_MCC Fracture[0m:  0.95323, [1m[36mtrain_MCC Support Devices[0m:  0.96132, [1m[36mtrain_MCC AVG[0m:  0.95461, [1m[36mtrain_Precision No Finding[0m:  0.99153, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97895, 

100%|██████████| 149/149 [00:48<00:00,  3.10it/s]
100%|██████████| 149/149 [00:39<00:00,  3.73it/s]
100%|██████████| 16/16 [00:04<00:00,  3.28it/s]


[1m[32mepoch[0m:   39, [1m[32mseconds_training_epoch[0m: 48.015
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.19112, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96685, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93080, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97729, [1m[36mtrain_MCC Lung Opacity[0m:  0.94676, [1m[36mtrain_MCC Lung Lesion[0m:  0.94616, [1m[36mtrain_MCC Edema[0m:  0.97049, [1m[36mtrain_MCC Consolidation[0m:  0.95474, [1m[36mtrain_MCC Pneumonia[0m:  0.97056, [1m[36mtrain_MCC Atelectasis[0m:  0.97041, [1m[36mtrain_MCC Pneumothorax[0m:  0.91532, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96809, [1m[36mtrain_MCC Pleural Other[0m:  0.98402, [1m[36mtrain_MCC Fracture[0m:  0.95282, [1m[36mtrain_MCC Support Devices[0m:  0.95682, [1m[36mtrain_MCC AVG[0m:  0.95794, [1m[36mtrain_Precision No Finding[0m:  0.97447, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.93878, [

100%|██████████| 149/149 [00:49<00:00,  3.03it/s]
100%|██████████| 149/149 [00:38<00:00,  3.85it/s]
100%|██████████| 16/16 [00:04<00:00,  3.32it/s]


[1m[32mepoch[0m:   40, [1m[32mseconds_training_epoch[0m: 49.2443
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.73679, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95018, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95701, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96482, [1m[36mtrain_MCC Lung Opacity[0m:  0.92932, [1m[36mtrain_MCC Lung Lesion[0m:  0.96772, [1m[36mtrain_MCC Edema[0m:  0.95075, [1m[36mtrain_MCC Consolidation[0m:  0.96172, [1m[36mtrain_MCC Pneumonia[0m:  0.93071, [1m[36mtrain_MCC Atelectasis[0m:  0.92942, [1m[36mtrain_MCC Pneumothorax[0m:  0.91602, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95847, [1m[36mtrain_MCC Pleural Other[0m:  0.96780, [1m[36mtrain_MCC Fracture[0m:  0.96630, [1m[36mtrain_MCC Support Devices[0m:  0.94962, [1m[36mtrain_MCC AVG[0m:  0.94999, [1m[36mtrain_Precision No Finding[0m:  0.96154, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97895, 

100%|██████████| 149/149 [00:50<00:00,  2.94it/s]
100%|██████████| 149/149 [00:37<00:00,  3.99it/s]
100%|██████████| 16/16 [00:04<00:00,  3.25it/s]


[1m[32mepoch[0m:   41, [1m[32mseconds_training_epoch[0m: 50.6597
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.54973, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96926, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95174, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96700, [1m[36mtrain_MCC Lung Opacity[0m:  0.94400, [1m[36mtrain_MCC Lung Lesion[0m:  0.94102, [1m[36mtrain_MCC Edema[0m:  0.93945, [1m[36mtrain_MCC Consolidation[0m:  0.95491, [1m[36mtrain_MCC Pneumonia[0m:  0.94099, [1m[36mtrain_MCC Atelectasis[0m:  0.94830, [1m[36mtrain_MCC Pneumothorax[0m:  0.92519, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97001, [1m[36mtrain_MCC Pleural Other[0m:  0.88739, [1m[36mtrain_MCC Fracture[0m:  0.93283, [1m[36mtrain_MCC Support Devices[0m:  0.93795, [1m[36mtrain_MCC AVG[0m:  0.94358, [1m[36mtrain_Precision No Finding[0m:  0.97458, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96875, 

100%|██████████| 149/149 [00:52<00:00,  2.86it/s]
100%|██████████| 149/149 [00:36<00:00,  4.14it/s]
100%|██████████| 16/16 [00:04<00:00,  3.32it/s]


[1m[32mepoch[0m:   42, [1m[32mseconds_training_epoch[0m: 52.177
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.03525, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.97399, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95210, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95450, [1m[36mtrain_MCC Lung Opacity[0m:  0.93574, [1m[36mtrain_MCC Lung Lesion[0m:  0.93029, [1m[36mtrain_MCC Edema[0m:  0.96316, [1m[36mtrain_MCC Consolidation[0m:  0.94746, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.96119, [1m[36mtrain_MCC Pneumothorax[0m:  0.97197, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97679, [1m[36mtrain_MCC Pleural Other[0m:  0.91803, [1m[36mtrain_MCC Fracture[0m:  0.95973, [1m[36mtrain_MCC Support Devices[0m:  0.95142, [1m[36mtrain_MCC AVG[0m:  0.95340, [1m[36mtrain_Precision No Finding[0m:  0.97881, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95918, [

100%|██████████| 149/149 [00:53<00:00,  2.78it/s]
100%|██████████| 149/149 [00:34<00:00,  4.36it/s]
100%|██████████| 16/16 [00:04<00:00,  3.26it/s]


[1m[32mepoch[0m:   43, [1m[32mseconds_training_epoch[0m: 53.5542
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.22870, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95705, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95726, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97311, [1m[36mtrain_MCC Lung Opacity[0m:  0.94768, [1m[36mtrain_MCC Lung Lesion[0m:  0.94055, [1m[36mtrain_MCC Edema[0m:  0.94336, [1m[36mtrain_MCC Consolidation[0m:  0.95830, [1m[36mtrain_MCC Pneumonia[0m:  0.92126, [1m[36mtrain_MCC Atelectasis[0m:  0.96127, [1m[36mtrain_MCC Pneumothorax[0m:  0.92462, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95937, [1m[36mtrain_MCC Pleural Other[0m:  0.98402, [1m[36mtrain_MCC Fracture[0m:  0.97990, [1m[36mtrain_MCC Support Devices[0m:  0.96131, [1m[36mtrain_MCC AVG[0m:  0.95493, [1m[36mtrain_Precision No Finding[0m:  0.97817, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96907, 

100%|██████████| 149/149 [00:55<00:00,  2.69it/s]
100%|██████████| 149/149 [00:33<00:00,  4.50it/s]
100%|██████████| 16/16 [00:04<00:00,  3.30it/s]


[1m[32mepoch[0m:   44, [1m[32mseconds_training_epoch[0m: 55.3011
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.71085, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.97866, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95701, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96686, [1m[36mtrain_MCC Lung Opacity[0m:  0.96053, [1m[36mtrain_MCC Lung Lesion[0m:  0.96207, [1m[36mtrain_MCC Edema[0m:  0.95437, [1m[36mtrain_MCC Consolidation[0m:  0.95817, [1m[36mtrain_MCC Pneumonia[0m:  0.94099, [1m[36mtrain_MCC Atelectasis[0m:  0.94830, [1m[36mtrain_MCC Pneumothorax[0m:  0.95657, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97872, [1m[36mtrain_MCC Pleural Other[0m:  0.95181, [1m[36mtrain_MCC Fracture[0m:  0.97319, [1m[36mtrain_MCC Support Devices[0m:  0.95952, [1m[36mtrain_MCC AVG[0m:  0.96048, [1m[36mtrain_Precision No Finding[0m:  0.98718, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97895, 

100%|██████████| 149/149 [00:56<00:00,  2.62it/s]
100%|██████████| 149/149 [00:32<00:00,  4.64it/s]
100%|██████████| 16/16 [00:04<00:00,  3.72it/s]


[1m[32mepoch[0m:   45, [1m[32mseconds_training_epoch[0m: 56.7805
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.07574, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95018, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.92015, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96498, [1m[36mtrain_MCC Lung Opacity[0m:  0.94861, [1m[36mtrain_MCC Lung Lesion[0m:  0.93490, [1m[36mtrain_MCC Edema[0m:  0.95688, [1m[36mtrain_MCC Consolidation[0m:  0.96203, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.95380, [1m[36mtrain_MCC Pneumothorax[0m:  0.95036, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96809, [1m[36mtrain_MCC Pleural Other[0m:  0.95181, [1m[36mtrain_MCC Fracture[0m:  0.96636, [1m[36mtrain_MCC Support Devices[0m:  0.95952, [1m[36mtrain_MCC AVG[0m:  0.95278, [1m[36mtrain_Precision No Finding[0m:  0.96154, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.92857, 

100%|██████████| 149/149 [00:57<00:00,  2.59it/s]
100%|██████████| 149/149 [00:32<00:00,  4.56it/s]
100%|██████████| 16/16 [00:03<00:00,  4.13it/s]


[1m[32mepoch[0m:   46, [1m[32mseconds_training_epoch[0m: 57.5146
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.98765, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96926, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.97325, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97106, [1m[36mtrain_MCC Lung Opacity[0m:  0.93574, [1m[36mtrain_MCC Lung Lesion[0m:  0.96247, [1m[36mtrain_MCC Edema[0m:  0.95586, [1m[36mtrain_MCC Consolidation[0m:  0.97934, [1m[36mtrain_MCC Pneumonia[0m:  0.99027, [1m[36mtrain_MCC Atelectasis[0m:  0.95919, [1m[36mtrain_MCC Pneumothorax[0m:  0.96595, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96905, [1m[36mtrain_MCC Pleural Other[0m:  0.93658, [1m[36mtrain_MCC Fracture[0m:  0.92574, [1m[36mtrain_MCC Support Devices[0m:  0.96132, [1m[36mtrain_MCC AVG[0m:  0.96108, [1m[36mtrain_Precision No Finding[0m:  0.97458, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.98958, 

100%|██████████| 149/149 [00:56<00:00,  2.62it/s]
100%|██████████| 149/149 [00:34<00:00,  4.38it/s]
100%|██████████| 16/16 [00:03<00:00,  4.05it/s]


[1m[32mepoch[0m:   47, [1m[32mseconds_training_epoch[0m: 56.8087
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.67362, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96467, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96249, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97741, [1m[36mtrain_MCC Lung Opacity[0m:  0.95599, [1m[36mtrain_MCC Lung Lesion[0m:  0.96221, [1m[36mtrain_MCC Edema[0m:  0.96293, [1m[36mtrain_MCC Consolidation[0m:  0.97232, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.96136, [1m[36mtrain_MCC Pneumothorax[0m:  0.98448, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96036, [1m[36mtrain_MCC Pleural Other[0m:  0.95327, [1m[36mtrain_MCC Fracture[0m:  0.94060, [1m[36mtrain_MCC Support Devices[0m:  0.95416, [1m[36mtrain_MCC AVG[0m:  0.96168, [1m[36mtrain_Precision No Finding[0m:  0.96639, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97917, 

100%|██████████| 149/149 [00:55<00:00,  2.71it/s]
100%|██████████| 149/149 [00:35<00:00,  4.20it/s]
100%|██████████| 16/16 [00:03<00:00,  4.11it/s]


[1m[32mepoch[0m:   48, [1m[32mseconds_training_epoch[0m: 55.074
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.98168, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95508, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93586, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96076, [1m[36mtrain_MCC Lung Opacity[0m:  0.95777, [1m[36mtrain_MCC Lung Lesion[0m:  0.97865, [1m[36mtrain_MCC Edema[0m:  0.96416, [1m[36mtrain_MCC Consolidation[0m:  0.94055, [1m[36mtrain_MCC Pneumonia[0m:  0.92253, [1m[36mtrain_MCC Atelectasis[0m:  0.95735, [1m[36mtrain_MCC Pneumothorax[0m:  0.96881, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97390, [1m[36mtrain_MCC Pleural Other[0m:  1.00000, [1m[36mtrain_MCC Fracture[0m:  0.94628, [1m[36mtrain_MCC Support Devices[0m:  0.95592, [1m[36mtrain_MCC AVG[0m:  0.95840, [1m[36mtrain_Precision No Finding[0m:  0.96186, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94845, [

100%|██████████| 149/149 [00:53<00:00,  2.79it/s]
100%|██████████| 149/149 [00:36<00:00,  4.04it/s]
100%|██████████| 16/16 [00:03<00:00,  4.14it/s]


[1m[32mepoch[0m:   49, [1m[32mseconds_training_epoch[0m: 53.4094
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.19989, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96454, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.98400, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96902, [1m[36mtrain_MCC Lung Opacity[0m:  0.94033, [1m[36mtrain_MCC Lung Lesion[0m:  0.95221, [1m[36mtrain_MCC Edema[0m:  0.96674, [1m[36mtrain_MCC Consolidation[0m:  0.94399, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.96308, [1m[36mtrain_MCC Pneumothorax[0m:  0.95357, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95939, [1m[36mtrain_MCC Pleural Other[0m:  0.95181, [1m[36mtrain_MCC Fracture[0m:  0.96636, [1m[36mtrain_MCC Support Devices[0m:  0.94874, [1m[36mtrain_MCC AVG[0m:  0.95821, [1m[36mtrain_Precision No Finding[0m:  0.97034, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  1.00000, 

100%|██████████| 149/149 [00:52<00:00,  2.86it/s]
100%|██████████| 149/149 [00:38<00:00,  3.87it/s]
100%|██████████| 16/16 [00:03<00:00,  4.01it/s]

[1m[32mepoch[0m:   50, [1m[32mseconds_training_epoch[0m: 52.032
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.18491, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.98106, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.98404, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97525, [1m[36mtrain_MCC Lung Opacity[0m:  0.93574, [1m[36mtrain_MCC Lung Lesion[0m:  0.96221, [1m[36mtrain_MCC Edema[0m:  0.95579, [1m[36mtrain_MCC Consolidation[0m:  0.97570, [1m[36mtrain_MCC Pneumonia[0m:  0.95118, [1m[36mtrain_MCC Atelectasis[0m:  0.95389, [1m[36mtrain_MCC Pneumothorax[0m:  0.95616, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96905, [1m[36mtrain_MCC Pleural Other[0m:  0.95181, [1m[36mtrain_MCC Fracture[0m:  0.91220, [1m[36mtrain_MCC Support Devices[0m:  0.94602, [1m[36mtrain_MCC AVG[0m:  0.95787, [1m[36mtrain_Precision No Finding[0m:  0.98723, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.98980, [




In [None]:
# MODELS = {
#     ('effnetv2', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_effnetv2(pretrain, int(in_ch), int(out_ch))),
#     ('resnet50', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_resnet('resnet50', pretrain, int(in_ch), int(out_ch))),
#     ('resnet18', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_resnet('resnet18', pretrain, int(in_ch), int(out_ch))),
#     ('efficientnet-b0', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_efficientnetv1('efficientnet-b0', pretrain, int(in_ch), int(out_ch))),
#     ('efficientnet-b1', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_efficientnetv1('efficientnet-b1', pretrain, int(in_ch), int(out_ch))),
#     ('waveletres18', str, str, str): lambda pretrain, in_ch, out_ch: R(
#         pretrain, int(in_ch), int(out_ch)),
#     ('waveletmlp', str, str, str, str, str, str, str): (
#         lambda mlp_channels, in_ch, out_ch, wavelet_levels, patch_size, in_ch_mul, mlp_depth: get_DeepFixEnd2End(
#             int(in_ch), int(out_ch),
#             in_ch_multiplier=int(in_ch_mul), wavelet='db1',
#             wavelet_levels=int(wavelet_levels), wavelet_patch_size=int(patch_size),
#             mlp_depth=int(mlp_depth), mlp_channels=int(mlp_channels),
#             mlp_fix_weights='none', mlp_activation=None)
#         ),

#     #  ('waveletres18v2', str, str, str): lambda pretrain, in_ch, out_ch: (
#         #  DeepFixCompression(levels=8, wavelet='coif1', patch_size=1),
#         #  R2(pretrain, int(in_ch), int(out_ch))),
# }


# class R(T.nn.Module):
#     def __init__(self, pretrain, in_ch, out_ch):
#         super().__init__()
#         self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)
#         self.dwt = pyw.DWT(J=8, wave='coif1', mode='zero')

#     @staticmethod
#     def wavelet_coefficients_as_tensorimage(approx, detail, normalize=False):
#         B,C = approx.shape[:2]
#         fixed_dims = approx.shape[:-2] # num images in minibatch, num channels, etc
#         output_shape = fixed_dims + (
#             detail[0].shape[-2]*2,  # input img height
#             detail[0].shape[-1]*2)  # input img width
#         im = T.zeros(output_shape, device=approx.device, dtype=approx.dtype)
#         if normalize:
#             norm11 = lambda x: (x / max(x.min()*-1, x.max()))  # into [-1,+1] preserving sign
#             #  approx = norm11(approx)
#         im[..., :approx.shape[-2], :approx.shape[-1]] = approx if approx is not None else 0
#         for level in detail:
#             lh, hl, hh = level.unbind(-3)
#             h,w = lh.shape[-2:]
#             if normalize:
#                 lh, hl, hh = [norm11(x) for x in [lh, hl, hh]]
#             #  im[:h, :w] = approx
#             im[..., 0:h, w:w+w] = lh  # horizontal
#             im[..., h:h+h, :w] = hl  # vertical
#             im[..., h:h+h, w:w+w] = hh  # diagonal
#         return im

#     def forward(self, x):
#         x = self.wavelet_coefficients_as_tensorimage(*self.dwt(x))
#         return self.r(x)


# class R2(T.nn.Module):
#     def __init__(self, pretrain, in_ch, out_ch):
#         super().__init__()
#         self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)

#     def forward(self, x):
#         B,C,H = x.shape
#         x = x.unsqueeze(-1).repeat(1,1,1,H)
#         return self.r(x)


# class LossCheXpertIdentity(T.nn.Module):
#     def __init__(self, N):
#         super().__init__()
#         self.bce = T.nn.BCEWithLogitsLoss()
#         self.N = N

#     def forward(self, yhat, y):
#         # absolute max possible num patients in chexpert is 223414
#         # but let's just hash them into a smaller number of bins via modulo N
#         assert self.N == yhat.shape[1], \
#                 f'note: model must have {self.N} binary predictions per sample'
#         y_onehot = y.new_zeros(y.shape[0], self.N, dtype=T.float
#                                ).scatter_(1, y.long()%self.N, 1)
#         return self.bce(yhat[:, -1], y_onehot[:, -1])


# class LossCheXpertUignore(T.nn.Module):
#     def __init__(self):
#         super().__init__()
#         self.bce = T.nn.BCEWithLogitsLoss()

#     def forward(self, yhat, y):
#         ignore = (y != 2)  # ignore uncertainty labels
#         return self.bce(yhat[ignore], y[ignore])


# def loss_intelmobileodt(yhat, y):
#     """BCE Loss with class balancing weights.

#     Not sure this actually helps, because Type 2 is the hardest class: it
#     has the most samples, and it separates Type 1 from Type 3.  Arguably, Type 2
#     samples are on the decision boundary between Type 1 and 3.
#     Class balancing weights make it harder to focus on class 2.
#     """
#     #  assert y.shape == yhat.shape, 'sanity check'
#     #  assert y.dtype == yhat.dtype, 'sanity check'

#     # class distribution of stage='train'
#     w = T.tensor([249, 781, 450], dtype=y.dtype, device=y.device)
#     w = (w.max() / w).reshape(1, 3)
#     # w can have any of the shapes:  (B,1) or (1,C) or (B,C)
#     #  return T.nn.functional.binary_cross_entropy_with_logits(yhat, y, weight=w)
#     return T.nn.functional.cross_entropy(yhat, y, weight=w)
#     # can't apply focal loss unless do it manually.


# def onehot(y, nclasses):
#     return T.zeros((y.numel(), nclasses), dtype=y.dtype, device=y.device)\
#             .scatter_(1, y.unsqueeze(1), 1)


# def _upsample_pad_minibatch_imgs_to_same_size(batch, target_is_segmentation_mask=False):
#     """a collate function for a dataloader of (x,y) samples.  """
#     shapes = [item[0].shape for item in batch]
#     H = max(h for c,h,w in shapes)
#     W = max(w for c,h,w in shapes)
#     X, Y = [], []
#     for item in batch:
#         h,w = item[0].shape[1:]
#         dh, dw = (H-h), (W-w)
#         padding = (dw//2, dw-dw//2, dh//2, dh-dh//2, )
#         X.append(T.nn.functional.pad(item[0], padding))
#         if target_is_segmentation_mask:
#             Y.append(T.nn.functional.pad(item[1], padding))
#         else:
#             Y.append(item[1])
#     return T.stack(X), T.stack(Y)


# def get_dset_chexpert(train_frac=.8, val_frac=.2, small=False,
#                       labels:str='diagnostic', num_identities=None):
#     """
#     Args:
#         labels:  either "diagnostic" (the 14 classes defined as
#             D.CheXpert.LABELS_DIAGNOSTIC) or "identity" ("patient", "study",
#             "view", "index")
#         small:  whether to use CheXpert_Small dataset (previously downsampled
#             images) or the full-size dataset.
#         num_identities:  used only if labels='identity'.  If
#             num_identities=1000, then all patients get identified as coming
#             from precisely 1 of 1000 bins.

#     Returns:
#         (
#         {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
#          'train_loader': ..., 'val_loader': ..., 'test_loader': ...
#          },

#         ('Pneumonia', 'Cardiomegaly', ...)  # class names defined by `labels`
#         )
#     """
#     _label_cleanup_dct = dict(D.CheXpert.LABEL_CLEANUP_DICT)
#     if labels == 'diagnostic':
#         class_names = D.CheXpert.LABELS_DIAGNOSTIC
#         for k in class_names:
#             _label_cleanup_dct[k][np.nan] = 0  # remap missing value to negative
#         get_ylabels = lambda dct: \
#                 D.CheXpert.format_labels(dct, labels=class_names).float()
#     elif labels == 'identity':
#         class_names = list(range(num_identities))
#         get_ylabels = lambda dct: \
#                 (D.CheXpert.format_labels(dct, labels=['index']) % num_identities).long()
#     else:
#         raise NotImplementedError(f"unrecognized labels: {labels}")
#     kws = dict(
#         img_transform=tvt.Compose([
#             #  tvt.RandomCrop((512, 512)),
#             tvt.ToTensor(),  # full res 1024x1024 imgs
#         ]),
#         getitem_transform=lambda dct: (dct['image'], get_ylabels(dct)),
#         label_cleanup_dct=_label_cleanup_dct,
#     )
#     if small:
#         kls = D.CheXpert_Small
#     else:
#         kls = D.CheXpert

#     train_dset = kls(dataset_dir="../data/CheXpert-v1.0-small/",use_train_set=True, **kws)  #Edited Elvin

#     N = len(train_dset)
#     if train_frac + val_frac == 1:
#         nsplits = [N - int(N*val_frac), int(N*val_frac), 0]
#     else:
#         a,b = int(N*train_frac), int(N*val_frac)
#         nsplits = [a,b, N-a-b]
#     train_dset, val_dset, _ = T.utils.data.random_split(train_dset, nsplits)
#     test_dset = kls(dataset_dir="../data/CheXpert-v1.0-small/",use_train_set=False, **kws) #Edited Elvin
#     batch_dct = dict(
#         batch_size=15, collate_fn=_upsample_pad_minibatch_imgs_to_same_size,
#         num_workers=int(os.environ.get("num_workers", 4)))  # upsample pad must take time
#     train_loader=DataLoader(train_dset, shuffle=True, **batch_dct)
#     val_loader=DataLoader(val_dset, **batch_dct)
#     test_loader=DataLoader(test_dset, **batch_dct)
#     return (dict(
#         train_dset=train_dset, val_dset=val_dset, test_dset=test_dset,
#         train_loader=train_loader, val_loader=val_loader, test_loader=test_loader,
#     ), class_names)


# def get_dset_intel_mobileodt(stage_trainval:str, use_val:str, stage_test:str, augment:str
#                              ) -> (dict[str,Optional[Union[Dataset,DataLoader]]], tuple[str]):
#     """Obtain train/val/test splits for the IntelMobileODT Cervical Cancer
#     Colposcopy dataset, and the data loaders.

#     Args:
#         stage_trainval: the `stage` for training and validation.
#             i.e. Possible choices:  {'train', 'train+additional'}
#             Train / val split is 70/30 random stratified split.
#         use_val: Whether to create a validation set
#             Choices:  {"val", "noval"}
#         stage_test: the `stage` for test set.  Should be "test".
#         augment: Type of augmentations to apply.  One of {'v1', }.
#             "v1" - make the aspect ratio .75, resize images to (200,150), and convert in range [0,1]
#     Returns:
#         (
#         {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
#          'train_loader': ..., 'val_loader': ..., 'test_loader': ...
#          },

#         ('Type 1', 'Type 2', 'Type 3')
#         )
#     """
#     assert augment == 'v1', 'code bug: other augmentations not implemented'
#     base_dir = './data/intel_mobileodt_cervical_resized'
#     dset_trainval = D.IntelMobileODTCervical(stage_trainval, base_dir)
#     _y = [dset_trainval.getitem(i, load_img=False)
#           for i in range(len(dset_trainval))]
#     dct = {'test_dset': D.IntelMobileODTCervical(stage_test, base_dir)}
#     if use_val == 'noval':
#         dct['train_dset'] = dset_trainval
#         dct['val_dset'] = None
#     else:
#         assert use_val == 'val', f'unrecognized option: {use_val}'
#         idxs_train, idxs_val = list(
#             StratifiedShuffleSplit(1, test_size=.3).split(
#                 np.arange(len(dset_trainval)), _y))[0]
#         dct['train_dset'] = T.utils.data.Subset(dset_trainval, idxs_train)
#         dct['val_dset'] = T.utils.data.Subset(dset_trainval, idxs_val)

#     # preprocess train/val/test images all the same way
#     preprocess_v1 = tvt.Compose([
#         #
#         ### previously done (to save computation time) ###
#         #  D.IntelMobileODTCervical.fix_aspect_ratio,
#         #  tvt.Resize((200, 150)),  # interpolation=tvt.InterpolationMode.NEAREST),
#         #
#         lambda x: x.float()/255.
#     ])
#     dct = {k: D.PreProcess(v, lambda xy: (
#         preprocess_v1(xy[0]),
#         #  onehot(xy[1].unsqueeze(0).long()-1, 3).squeeze_().float()))
#         xy[1].long()-1))
#         for k,v in dct.items()}
#     dct.update(dict(
#         train_loader=DataLoader(dct['train_dset'], batch_size=20, shuffle=True),
#         test_loader=DataLoader(dct['test_dset'], batch_size=20),))
#     if dct['val_dset'] is None:
#         dct['val_loader'] = None
#     else:
#         dct['val_loader'] = DataLoader(dct['val_dset'], batch_size=20)
#     class_names = [x.replace('_', ' ') for x in D.IntelMobileODTCervical.LABEL_NAMES]
#     return dct, class_names


# LOSS_FNS = {
#     ('BCEWithLogitsLoss', ): lambda _: T.nn.BCEWithLogitsLoss(),
#     ('CrossEntropyLoss', ): lambda _: T.nn.CrossEntropyLoss(),
#     ('CE_intelmobileodt', ): lambda _: loss_intelmobileodt,
#     ('chexpert_uignore', ): lambda _: LossCheXpertUignore(),
#     ('chexpert_identity', str): lambda out_ch: LossCheXpertIdentity(N=int(out_ch)),
# }

# DSETS = {
#     ('intel_mobileodt', str, str, str, str): (
#         lambda train, val, test, aug: get_dset_intel_mobileodt(train, val, test, aug)),
#     #  ('origa', ... todo): ( lambda ...: get_dset_origa(...)
#     #  ('riga', ... todo): ( lambda ...: get_dset_riga(...)
#     ('chexpert', str, str): (
#         lambda train_frac, val_frac: get_dset_chexpert(
#             float(train_frac), float(val_frac), small=False, labels='diagnostic')),
#     ('chexpert_small', str, str): (
#         lambda train_frac, val_frac: get_dset_chexpert(
#             float(train_frac), float(val_frac), small=True, labels='diagnostic')),
#     ('chexpert_small_ID', str, str, str): (
#         lambda num_identities, train_frac, val_frac: get_dset_chexpert(
#             float(train_frac), float(val_frac), small=True,
#             labels='identity', num_identities=int(num_identities))),
# }


# def match(spec:str, dct:dict):
#     return pampy.match(spec.split(':'), *(x for y in dct.items() for x in y))


# def get_model_opt_loss(
#         model_spec:str, opt_spec:str, loss_spec:str, regularizer_spec:str,
#         device:str) -> dict[str, Union[T.nn.Module, T.optim.Optimizer]]:
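#     """
#     Build the model, optimizer and loss function from their string specs.
#     Args:
#         model_spec: a string of form,
#             "model_name:pretraining:in_channels:out_classes".  For example:
#             "effnetv2:untrained:1:5"
#         opt_spec: Specifies how to create optimizer.
#             First value is a pytorch Optimizer in T.optim.*.
#             Other values are numerical parameters.
#             Example: "SGD:lr=.003:momentum=.9"
#         loss_spec: a key of LOSS_FNS.
#             Example: "CrossEntropyLoss" or "chexpert_identity:N"
#         regularizer_spec: 'none' to use the loss as is; any other value
#             wraps the loss in RegularizedLoss (e.g. "deepfixmlp:X").
#         device: e.g. 'cpu' or 'cuda'
#     Returns:
#         a dict with keys "model", "optimizer" and "loss_fn"
#     """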
#     mdl = match(model_spec, MODELS)
#     mdl = mdl.to(device, non_blocking=True)
#     optimizer = reset_optimizer(opt_spec, mdl)
#     loss_fn = match(loss_spec, LOSS_FNS)
#     if regularizer_spec != 'none':
#         loss_fn = RegularizedLoss(mdl, loss_fn, regularizer_spec)
#     return dict(model=mdl, optimizer=optimizer, loss_fn=loss_fn)


# class RegularizedLoss(T.nn.Module):
#     def __init__(self, model, lossfn, regularizer_spec:str):
#         super().__init__()
#         self.lossfn = lossfn
#         self.regularizer_spec = regularizer_spec
#         if regularizer_spec == 'none':
#             self.regularizer = lambda *y: 0
#         elif regularizer_spec.startswith('deepfixmlp:'):
#             lbda = float(regularizer_spec.split(':')[1])
#             self.regularizer = lambda *y: (
#                 float(lbda) * DeepFixMLP.get_VecAttn_regularizer(model))
#         else:
#             raise NotImplementedError(regularizer_spec)

#     def forward(self, yhat, y):
#         return self.lossfn(yhat, y) + self.regularizer(yhat, y)

#     def __repr__(self):
#         return f'RegularizedLoss<{repr(self.lossfn)},{self.regularizer_spec}>'


# def get_dset_loaders_resultfactory(dset_spec:str) -> dict:
#     dct, class_names = match(dset_spec, DSETS)
#     if any(dset_spec.startswith(x) for x in {'intel_mobileodt:',
#                                              'chexpert_small_ID:'}):
#         #  dct['result_factory'] = lambda: TL.MultiLabelBinaryClassification(
#                 #  class_names, binarize_fn=lambda yh: (T.sigmoid(yh)>.5).long())
#         dct['result_factory'] = lambda: TL.MultiClassClassification(
#                 len(class_names), binarize_fn=lambda yh: yh.softmax(1).argmax(1))
#     elif any(dset_spec.startswith(x) for x in {'chexpert:', 'chexpert_small:'}):
#         dct['result_factory'] = lambda: CheXpertMultiLabelBinaryClassification(
#             class_names, binarize_fn=lambda yh: (yh.sigmoid()>.5).long(), report_avg=True)
#     else:
#         raise NotImplementedError(f"I don't know how to create the result factory for {dset_spec}")
#     return dct

# class CheXpertMultiLabelBinaryClassification(TL.MultiLabelBinaryClassification):
#     def update(self, yhat, y, loss) -> None:
#         self.num_samples += yhat.shape[0]
#         self.loss += loss.item()
#         assert yhat.shape == y.shape
#         assert yhat.ndim == 2 and yhat.shape[1] == len(self._cms), "sanity check: model outputs expected prediction shape"
#         binarized = self._binarize_fn(yhat)
#         assert binarized.dtype == T.long, 'sanity check binarize fn'
#         assert binarized.shape == y.shape, 'sanity check binarize fn'
#         ignore = (y != 2)  # mask of entries to KEEP: True where the label is not 2 (the uncertainty label)
#         for i, (kls, cm) in enumerate(self._cms.items()):
#             rows = ignore[:, i]
#             if rows.sum() == 0:
#                 continue  # don't update a confusion matrix if all data for this class is ignored
#             cm += metrics.confusion_matrix(y[rows, i], binarized[rows, i], num_classes=2).cpu()


# def get_deepfix_train_strategy(args:'TrainOptions'):
#     deepfix_spec = args.deepfix
#     if deepfix_spec == 'off':
#         return TL.train_one_epoch
#     elif deepfix_spec.startswith('reinit:'):
#         _, N, P, R = deepfix_spec.split(':')
#         return dfs.DeepFix_TrainOneEpoch(int(N), float(P), int(R), TL.train_one_epoch)
#     elif deepfix_spec.startswith('dhist:'):
#         fp = deepfix_spec.split(':', 1)[1]
#         assert exists(fp), f'histogram file not found: {fp}'
#         return dfs.DeepFix_DHist(fp)
#     elif deepfix_spec.startswith('dfhist:'):
#         fp = deepfix_spec.split(':', 1)[1]
#         assert exists(fp), f'histogram file not found: {fp}'
#         return dfs.DeepFix_DHist(fp, fixed=True)
#     elif deepfix_spec == 'fixed':
#         return dfs.DeepFix_DHist('', fixed=True, init_with_hist=False)
#     elif deepfix_spec.startswith('beta:'):
#         alpha, beta = deepfix_spec.split(':')[1:]
#         return dfs.DeepFix_LambdaInit(
#             lambda cfg: init_from_beta(cfg.model, float(alpha), float(beta)))
#     elif deepfix_spec.startswith('ghaarconv2d:'):
#         ignore_layers = deepfix_spec.split(':')[1].split(',')
#         return dfs.DeepFix_LambdaInit(
#             lambda cfg: (
#                 print(f'initialize {deepfix_spec}'),
#                 convert_conv2d_to_gHaarConv2d(cfg.model, ignore_layers=ignore_layers),
#                 reset_optimizer(args.opt, cfg.model),
#                 print(cfg.model)
#             ))
#     else:
#         raise NotImplementedError(deepfix_spec)


# def train_config(args:'TrainOptions') -> TL.TrainConfig:
#     return TL.TrainConfig(
#         **get_model_opt_loss(
#             args.model, args.opt, args.lossfn, args.loss_reg, args.device),
#         **get_dset_loaders_resultfactory(args.dset),
#         device=args.device,
#         epochs=args.epochs,
#         start_epoch=args.start_epoch,
#         train_one_epoch=get_deepfix_train_strategy(args),
#         experiment_id=args.experiment_id,
#     )


# @dc.dataclass
# class TrainOptions:
#     """High-level configuration for training PyTorch models
#     on the datasets registered in DSETS (e.g. IntelMobileODTCervical, CheXpert).
#     """
#     epochs:int = 50
#     start_epoch:int = 0  # if "--start_epoch 1", then don't evaluate perf before training.
#     device:str = 'cuda' if T.cuda.is_available() else 'cpu'
#     dset:str = None #choice(
#         #  'intel_mobileodt:train:val:test:v1',
#         #  'intel_mobileodt:train+additional:val:test:v1',
#         #  'intel_mobileodt:train+additional:noval:test:v1',
#         #  'chexpert:.8:.2', 'chexpert:.01:.01', 'chexpert:.001:.001',
#         #  'chexpert_small:.8:.2', 'chexpert_small:.01:.01',
#         #   'chexpert_small:.001:.001',
#         #  default='intel_mobileodt:train:val:test:v1')
#     opt:str = 'SGD:lr=.001:momentum=.9:nesterov=1'
#     lossfn:str = None  # choices:
#         #  'BCEWithLogitsLoss',
#         #  'CrossEntropyLoss', 
#         #  'CE_intelmobileodt',
#         #  'chexpert_uignore', 
#         #  'chexpert_identity:N' for some N=num_identities predicted by model (compared to identities y%N)
#     loss_reg:str = 'none'  # Optional regularizer added to the loss (loss + reg).  Accepted values: 'none', or 'deepfixmlp:X' where X is a positive float giving the lambda of the l1 regularizer
#     model:str = 'resnet18:imagenet:3:3'  # Model specification adheres to the template "model_name:pretraining:in_ch:out_ch"
#     deepfix:str = 'off'  # DeepFix Re-initialization Method.
#                          #  "off" or "fixed" or "reinit:N:P:R" or "d[f]hist:path_to_histogram.pth"
#                          #  or "beta:A:B" for A,B as (float) parameters of the beta distribution
#                          #  or "ghaarconv2d:layer1,layer2", which replaces all spatial convolutions with GHaarConv2d layers except the specified layers
#     experiment_id:str = os.environ.get('run_id', 'debugging')
#     prune:str = 'off'

#     def execute(self):
#         cfg = train_config(self)
#         cfg.train(cfg)


# def main():
#     p = ArgumentParser()
#     p.add_arguments(TrainOptions, dest='TrainOptions')

# #     args = p.parse_args(["--dset", "chexpert_small:.01:.01", "--opt", "Adam:lr=0.001", "--lossfn", "chexpert_uignore", "--model", "waveletmlp:300:1:14:7:1:1:2", "--loss_reg", "none"]).TrainOptions

#     print(args)
#     cfg = train_config(args)
    
# # python deepfix/train.py --dset chexpert_small:.01:.01 --opt Adam:lr=0.001 --lossfn chexpert_uignore --model waveletmlp:300:1:14:7:1:1:2 --loss_reg none    
    
#     if args.prune != 'off':
#         assert args.prune.startswith('ChannelPrune:')
#         raise NotImplementedError('code is a bit hardcoded, so it is not available without hacking on it.')
#         print(args.prune)
#         from explainfix import channelprune
#         from deepfix.weight_saliency import costfn_multiclass
#         a = sum([x.numel() for x in cfg.model.parameters()])
#         channelprune(cfg.model, pct=5, grad_cost_fn=costfn_multiclass,
#                      loader=cfg.train_loader, device=cfg.device, num_minibatches=10)
#         b = sum([x.numel() for x in cfg.model.parameters()])
#         assert a/b != 1
#         print(f'done channelpruning.  {a/b}')

#     cfg.train(cfg)
#     #  import IPython ; IPython.embed() ; import sys ; sys.exit()

#     #  with T.profiler.profile(
#     #      activities=[
#     #          T.profiler.ProfilerActivity.CPU,
#     #          T.profiler.ProfilerActivity.CUDA,
#     #      ], with_modules=True,
#     #  ) as p:
#     #      cfg.train(cfg)
#     #  print(p.key_averages().table(
#     #      sort_by="self_cuda_time_total", row_limit=-1))


# if __name__ == "__main__":
#     main()


In [4]:
# os.getcwd()
# !ls

In [4]:
# args = {}
# args['dset'] = 'chexpert_small:.01:.01'
# args['opt'] = 'Adam:lr=0.001'
# args['lossfn'] = 'chexpert_uignore'
# args['model'] = 'waveletmlp:300:1:14:7:1:1:2'
# args['loss_reg'] = None
# args['prune'] = 'off'

In [9]:
# args.dset

In [21]:
# import pandas as pd

In [23]:
# t = pd.read_csv('../data/CheXpert-v1.0-small/train.csv')