In [1]:
"""
Boilerplate to implement training different networks on different datasets
with varying config.

I wish a machine could automate setting up decent baseline models and datasets
"""
#  import json
import os
from os.path import exists
import pampy
from simple_parsing import ArgumentParser, choice
from simplepytorch import datasets as D
from simplepytorch import trainlib as TL
from simplepytorch import metrics
from sklearn.model_selection import StratifiedShuffleSplit
from torch.utils.data import Dataset, DataLoader
from typing import Union, Optional
import dataclasses as dc
import numpy as np
import torch as T
import torchvision.transforms as tvt

from deepfix.models import get_effnetv2, get_resnet, get_efficientnetv1, get_DeepFixEnd2End, DeepFixMLP
from deepfix.models.ghaarconv import convert_conv2d_to_gHaarConv2d
from deepfix.init_from_distribution import init_from_beta, reset_optimizer
from deepfix import deepfix_strategies as dfs
import pytorch_wavelets as pyw



In [2]:
# Dispatch table from a model spec to a model constructor.
#
# Each key is a pattern for the ':'-separated fields of the spec string (see
# `match`): the first element is the literal model name and every `str` is one
# captured field.  The captured fields are handed, in order, to the lambda.
#
#   "<name>:<pretrain>:<in_ch>:<out_ch>"   for the CNN entries, and
#   "waveletmlp:<mlp_channels>:<in_ch>:<out_ch>:<wavelet_levels>:<patch_size>:<in_ch_mul>:<mlp_depth>"
#
# Fields arrive as strings, so numeric ones are converted with int() here.
MODELS = {
    ('effnetv2', str, str, str): (
        lambda weights, cin, cout: get_effnetv2(weights, int(cin), int(cout))),

    ('resnet50', str, str, str): (
        lambda weights, cin, cout: get_resnet(
            'resnet50', weights, int(cin), int(cout))),

    ('resnet18', str, str, str): (
        lambda weights, cin, cout: get_resnet(
            'resnet18', weights, int(cin), int(cout))),

    ('efficientnet-b0', str, str, str): (
        lambda weights, cin, cout: get_efficientnetv1(
            'efficientnet-b0', weights, int(cin), int(cout))),

    ('efficientnet-b1', str, str, str): (
        lambda weights, cin, cout: get_efficientnetv1(
            'efficientnet-b1', weights, int(cin), int(cout))),

    # ResNet-18 on top of a wavelet coefficient image (class `R`).
    ('waveletres18', str, str, str): (
        lambda weights, cin, cout: R(weights, int(cin), int(cout))),

    # Wavelet front-end followed by an MLP; wavelet, weight fixing and
    # activation are pinned to 'db1', 'none' and None respectively.
    ('waveletmlp', str, str, str, str, str, str, str): (
        lambda width, cin, cout, levels, patch, cin_mul, depth: get_DeepFixEnd2End(
            int(cin), int(cout),
            in_ch_multiplier=int(cin_mul),
            wavelet='db1',
            wavelet_levels=int(levels),
            wavelet_patch_size=int(patch),
            mlp_depth=int(depth),
            mlp_channels=int(width),
            mlp_fix_weights='none',
            mlp_activation=None)),

    #  ('waveletres18v2', str, str, str): lambda pretrain, in_ch, out_ch: (
        #  DeepFixCompression(levels=8, wavelet='coif1', patch_size=1),
        #  R2(pretrain, int(in_ch), int(out_ch))),
}


class R(T.nn.Module):
    """ResNet-18 applied to a wavelet-coefficient image of the input.

    `forward` runs an 8-level `coif1` discrete wavelet transform (zero
    padding mode) on the input, tiles the resulting coefficients into one
    tensor image and feeds that image to the ResNet.
    """

    def __init__(self, pretrain, in_ch, out_ch):
        """
        Args:
            pretrain: forwarded to `get_resnet` as the pretraining choice.
            in_ch: number of input channels, forwarded to `get_resnet`.
            out_ch: number of outputs, forwarded to `get_resnet`.
        """
        super().__init__()
        self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)
        self.dwt = pyw.DWT(J=8, wave='coif1', mode='zero')

    @staticmethod
    def wavelet_coefficients_as_tensorimage(approx, detail, normalize=False):
        """Tile wavelet coefficients into a single tensor image.

        Args:
            approx: approximation coefficients of shape (..., h, w), or None
                to leave the top-left corner at zero.
            detail: non-empty list of detail tensors, one per level, each of
                shape (..., 3, h_l, w_l).  The three sub-bands of a level are
                written at [0:h_l, w_l:2*w_l], [h_l:2*h_l, 0:w_l] and
                [h_l:2*h_l, w_l:2*w_l].
            normalize: if True, each detail sub-band is divided by its largest
                absolute value (range [-1, 1], sign preserved).  An all-zero
                sub-band is left as zeros.  `approx` is never normalized.

        Returns:
            Tensor of shape (..., 2*h_0, 2*w_0) where (h_0, w_0) is the spatial
            size of `detail[0]`.  Levels are written in list order, so a later
            level overwrites any region it shares with an earlier one.
        """
        first = detail[0]
        if approx is None:
            # Detail tensors carry one extra axis (the 3 sub-bands).
            fixed_dims = tuple(first.shape[:-3])
            like = first
        else:
            fixed_dims = tuple(approx.shape[:-2])  # num images in minibatch, num channels, etc
            like = approx
        output_shape = fixed_dims + (
            first.shape[-2]*2,  # input img height
            first.shape[-1]*2)  # input img width
        im = T.zeros(output_shape, device=like.device, dtype=like.dtype)

        def norm11(x):
            # into [-1,+1] preserving sign; guard the all-zero case (0/0 -> NaN)
            peak = x.abs().max()
            return x if peak == 0 else x / peak

        if approx is not None:
            im[..., :approx.shape[-2], :approx.shape[-1]] = approx
        for level in detail:
            lh, hl, hh = level.unbind(-3)
            h, w = lh.shape[-2:]
            if normalize:
                lh, hl, hh = [norm11(x) for x in [lh, hl, hh]]
            im[..., 0:h, w:w+w] = lh  # horizontal
            im[..., h:h+h, :w] = hl  # vertical
            im[..., h:h+h, w:w+w] = hh  # diagonal
        return im

    def forward(self, x):
        """Wavelet-transform `x`, tile the coefficients, and classify them."""
        x = self.wavelet_coefficients_as_tensorimage(*self.dwt(x))
        return self.r(x)


class R2(T.nn.Module):
    """ResNet-18 for 3-D inputs: the last axis is tiled into a square image."""

    def __init__(self, pretrain, in_ch, out_ch):
        super().__init__()
        # Arguments are passed straight through to the ResNet factory.
        self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)

    def forward(self, x):
        """Turn a (B, C, H) tensor into (B, C, H, H) and run the ResNet on it.

        Every value `x[b, c, h]` is copied H times along a new last axis.
        """
        _, _, height = x.shape  # also enforces a 3-D input
        tiled = x.unsqueeze(-1).repeat(1, 1, 1, height)
        return self.r(tiled)


class LossCheXpertIdentity(T.nn.Module):
    """Binary cross-entropy against a one-hot encoding of `identity % N`.

    Each sample's integer identity is hashed into one of N bins (modulo N) and
    the model's N logits are scored against the one-hot vector of that bin.
    """

    def __init__(self, N):
        """
        Args:
            N: number of identity bins; must equal the model's output width.
        """
        super().__init__()
        self.bce = T.nn.BCEWithLogitsLoss()
        self.N = N

    def forward(self, yhat, y):
        """
        Args:
            yhat: logits of shape (B, N).
            y: integer identities of shape (B, 1) or (B,).
        Returns:
            Scalar BCE-with-logits loss over all N bins.
        Raises:
            AssertionError: if `yhat` does not have N columns.
        """
        # absolute max possible num patients in chexpert is 223414
        # but let's just hash them into a smaller number of bins via modulo N
        assert self.N == yhat.shape[1], \
                f'note: model must have {self.N} binary predictions per sample'
        # scatter_ needs a 2-D index; reshape also accepts a flat (B,) target.
        bins = (y.long() % self.N).reshape(y.shape[0], -1)
        y_onehot = y.new_zeros(y.shape[0], self.N, dtype=yhat.dtype
                               ).scatter_(1, bins, 1)
        # Score every bin.  Previously only the last column was compared, so
        # the other N-1 outputs never received a training signal.
        return self.bce(yhat, y_onehot)


class LossCheXpertUignore(T.nn.Module):
    """BCE-with-logits that skips every entry whose label equals 2.

    The label value 2 marks an "uncertain" annotation; those entries are
    dropped from both prediction and target before the loss is averaged.
    """

    def __init__(self):
        super().__init__()
        self.bce = T.nn.BCEWithLogitsLoss()

    def forward(self, yhat, y):
        """Return the mean BCE over the entries of `y` that are not 2."""
        certain = y.ne(2)  # True where the label is usable
        kept_logits = yhat[certain]
        kept_targets = y[certain]
        return self.bce(kept_logits, kept_targets)


def loss_intelmobileodt(yhat, y):
    """Cross-entropy loss with class balancing weights.

    Not sure this actually helps

    because Type 2 is the hardest class, it
    has the most samples, and it separates Type 1 from Type 3.  Arguably, Type 2
    samples are on the decision boundary between Type 1 and 3.
    Class balancing weights make it harder to focus on class 2.

    Args:
        yhat: logits of shape (B, 3).
        y: class-index targets, as accepted by `cross_entropy`.
    Returns:
        Scalar weighted cross-entropy loss.
    """
    # class distribution of stage='train'
    counts = T.tensor([249., 781., 450.], dtype=yhat.dtype, device=yhat.device)
    # Rarer classes get a larger weight; the most frequent class gets 1.
    # cross_entropy expects a 1-D weight of size C, in the logits' dtype
    # (the former (1, 3) reshape was a leftover from the BCE variant).
    w = counts.max() / counts
    return T.nn.functional.cross_entropy(yhat, y, weight=w)
    # can't apply focal loss unless do it manually.


def onehot(y, nclasses):
    """One-hot encode a 1-D tensor of class indices.

    Returns a (y.numel(), nclasses) tensor with the dtype and device of `y`,
    holding a 1 in column `y[i]` of row `i` and 0 elsewhere.
    """
    encoded = T.zeros((y.numel(), nclasses), dtype=y.dtype, device=y.device)
    column_index = y.unsqueeze(1)
    encoded.scatter_(1, column_index, 1)
    return encoded


def _upsample_pad_minibatch_imgs_to_same_size(batch, target_is_segmentation_mask=False):
    """a collate function for a dataloader of (x,y) samples.  """
    shapes = [item[0].shape for item in batch]
    H = max(h for c,h,w in shapes)
    W = max(w for c,h,w in shapes)
    X, Y = [], []
    for item in batch:
        h,w = item[0].shape[1:]
        dh, dw = (H-h), (W-w)
        padding = (dw//2, dw-dw//2, dh//2, dh-dh//2, )
        X.append(T.nn.functional.pad(item[0], padding))
        if target_is_segmentation_mask:
            Y.append(T.nn.functional.pad(item[1], padding))
        else:
            Y.append(item[1])
    return T.stack(X), T.stack(Y)


def get_dset_chexpert(train_frac=.8, val_frac=.2, small=False,
                      labels:str='diagnostic', num_identities=None,
                      dataset_dir:str="../data/CheXpert-v1.0-small/"):
    """Build CheXpert train/val/test datasets and their data loaders.

    Args:
        train_frac:  fraction of the official training set used for training.
        val_frac:  fraction of the official training set used for validation.
            If `train_frac + val_frac` is (numerically) 1, every sample is
            used; otherwise the remainder is discarded.
        labels:  either "diagnostic" (the 14 classes defined as
            D.CheXpert.LABELS_DIAGNOSTIC) or "identity" ("patient", "study",
            "view", "index")
        small:  whether to use CheXpert_Small dataset (previously downsampled
            images) or the full size dataset.
        num_identities:  used only if labels='identity'.  If
            num_identities=1000, then all patients get identified as coming
            from precisely 1 of 1000 bins.
        dataset_dir:  directory passed to the dataset class for both the
            training and the test set.

    Returns:
        (
        {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
         'train_loader': ..., 'val_loader': ..., 'test_loader': ...
         },

        ('Pneumonia', 'Cardiomegaly', ...)  # class names defined by `labels`
        )

    Raises:
        ValueError: if a fraction is negative or the fractions sum to more
            than 1.
        NotImplementedError: if `labels` is not recognized.
    """
    import copy
    import math

    uses_everything = math.isclose(train_frac + val_frac, 1)
    if train_frac < 0 or val_frac < 0 or (
            train_frac + val_frac > 1 and not uses_everything):
        raise ValueError(
            f"train_frac and val_frac must be >= 0 and sum to at most 1,"
            f" got {train_frac} and {val_frac}")

    # Outer dict is copied here; inner per-label dicts are copied right before
    # they are modified, so the class-level constant is never mutated.
    _label_cleanup_dct = dict(D.CheXpert.LABEL_CLEANUP_DICT)
    if labels == 'diagnostic':
        class_names = D.CheXpert.LABELS_DIAGNOSTIC
        for k in class_names:
            per_label = copy.copy(_label_cleanup_dct[k])
            per_label[np.nan] = 0  # remap missing value to negative
            _label_cleanup_dct[k] = per_label
        get_ylabels = lambda dct: \
                D.CheXpert.format_labels(dct, labels=class_names).float()
    elif labels == 'identity':
        class_names = list(range(num_identities))
        get_ylabels = lambda dct: \
                (D.CheXpert.format_labels(dct, labels=['index']) % num_identities).long()
    else:
        raise NotImplementedError(f"unrecognized labels: {labels}")
    kws = dict(
        img_transform=tvt.Compose([
#              tvt.RandomCrop((512, 512)),
            tvt.ToTensor(),  # full res 1024x1024 imgs
        ]),
        getitem_transform=lambda dct: (dct['image'], get_ylabels(dct)),
        label_cleanup_dct=_label_cleanup_dct,
    )
    kls = D.CheXpert_Small if small else D.CheXpert

    train_dset = kls(dataset_dir=dataset_dir, use_train_set=True, **kws)

    N = len(train_dset)
    n_val = int(N*val_frac)
    if uses_everything:
        # isclose instead of ==, so that e.g. .7 + .3 also takes this branch
        nsplits = [N - n_val, n_val, 0]
    else:
        n_train = int(N*train_frac)
        nsplits = [n_train, n_val, N - n_train - n_val]
    # the third split is the unused remainder
    train_dset, val_dset, _ = T.utils.data.random_split(train_dset, nsplits)
    test_dset = kls(dataset_dir=dataset_dir, use_train_set=False, **kws)
    batch_dct = dict(
        batch_size=15, collate_fn=_upsample_pad_minibatch_imgs_to_same_size,
        num_workers=int(os.environ.get("num_workers", 4)))  # upsample pad must take time
    train_loader=DataLoader(train_dset, shuffle=True, **batch_dct)
    val_loader=DataLoader(val_dset, **batch_dct)
    test_loader=DataLoader(test_dset, **batch_dct)
    return (dict(
        train_dset=train_dset, val_dset=val_dset, test_dset=test_dset,
        train_loader=train_loader, val_loader=val_loader, test_loader=test_loader,
    ), class_names)


def get_dset_intel_mobileodt(stage_trainval:str, use_val:str, stage_test:str, augment:str
                             ) -> (dict[str,Optional[Union[Dataset,DataLoader]]], tuple[str]):
    """Obtain train/val/test splits for the IntelMobileODT Cervical Cancer
    Colposcopy dataset, and the data loaders.

    Args:
        stage_trainval: the `stage` for training and validation.
            i.e. Possible choices:  {'train', 'train+additional'}
            Train / val split is 70/30 random stratified split.
        use_val: Whether to create a validation set
            Choices:  {"val", "noval"}
        stage_test: the `stage` for test set.  Should be "test".
        augment: Type of augmentations to apply.  One of {'v1', }.
            "v1" - make the aspect ratio .75, resize images to (200,150), and convert in range [0,1]
            (aspect ratio and resize were applied to the files beforehand;
            only the conversion to [0,1] happens here)
    Returns:
        (
        {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
         'train_loader': ..., 'val_loader': ..., 'test_loader': ...
         },

        ('Type 1', 'Type 2', 'Type 3')
        )
        With use_val="noval", both 'val_dset' and 'val_loader' are None.
    """
    assert augment == 'v1', 'code bug: other augmentations not implemented'
    base_dir = './data/intel_mobileodt_cervical_resized'
    dset_trainval = D.IntelMobileODTCervical(stage_trainval, base_dir)
    dct = {'test_dset': D.IntelMobileODTCervical(stage_test, base_dir)}
    if use_val == 'noval':
        dct['train_dset'] = dset_trainval
        dct['val_dset'] = None
    else:
        assert use_val == 'val', f'unrecognized option: {use_val}'
        # Labels are only needed to stratify the split, so they are collected
        # here rather than unconditionally.
        _y = [dset_trainval.getitem(i, load_img=False)
              for i in range(len(dset_trainval))]
        idxs_train, idxs_val = list(
            StratifiedShuffleSplit(1, test_size=.3).split(
                np.arange(len(dset_trainval)), _y))[0]
        dct['train_dset'] = T.utils.data.Subset(dset_trainval, idxs_train)
        dct['val_dset'] = T.utils.data.Subset(dset_trainval, idxs_val)

    # preprocess train/val/test images all the same way
    preprocess_v1 = tvt.Compose([
        #
        ### previously done (to save computation time) ###
        #  D.IntelMobileODTCervical.fix_aspect_ratio,
        #  tvt.Resize((200, 150)),  # interpolation=tvt.InterpolationMode.NEAREST),
        #
        lambda x: x.float()/255.
    ])

    def _preprocess_xy(xy):
        # image into [0,1]; labels shifted by -1 and cast to long
        #  onehot(xy[1].unsqueeze(0).long()-1, 3).squeeze_().float()))
        return preprocess_v1(xy[0]), xy[1].long()-1

    # Leave a missing validation set as None.  Wrapping None in PreProcess
    # would defeat the `is None` check below and yield a loader over nothing.
    dct = {k: (None if v is None else D.PreProcess(v, _preprocess_xy))
           for k, v in dct.items()}
    dct.update(dict(
        train_loader=DataLoader(dct['train_dset'], batch_size=20, shuffle=True),
        test_loader=DataLoader(dct['test_dset'], batch_size=20),))
    if dct['val_dset'] is None:
        dct['val_loader'] = None
    else:
        dct['val_loader'] = DataLoader(dct['val_dset'], batch_size=20)
    class_names = [x.replace('_', ' ') for x in D.IntelMobileODTCervical.LABEL_NAMES]
    return dct, class_names


# Dispatch table from a loss spec (split on ':' by `match`) to a loss callable.
# Single-field specs capture nothing, so their lambdas take one placeholder
# argument that is ignored.  'chexpert_identity:N' captures N as a string.
LOSS_FNS = {
    ('BCEWithLogitsLoss', ):
        lambda _unused: T.nn.BCEWithLogitsLoss(),
    ('CrossEntropyLoss', ):
        lambda _unused: T.nn.CrossEntropyLoss(),
    ('CE_intelmobileodt', ):
        lambda _unused: loss_intelmobileodt,
    ('chexpert_uignore', ):
        lambda _unused: LossCheXpertUignore(),
    ('chexpert_identity', str):
        lambda num_bins: LossCheXpertIdentity(N=int(num_bins)),
}

# Dispatch table from a dataset spec (split on ':' by `match`) to a function
# returning `(dict of datasets and loaders, class names)`.
#
#   "intel_mobileodt:<stage_trainval>:<use_val>:<stage_test>:<augment>"
#   "chexpert:<train_frac>:<val_frac>"
#   "chexpert_small:<train_frac>:<val_frac>"
#   "chexpert_small_ID:<num_identities>:<train_frac>:<val_frac>"
DSETS = {
    ('intel_mobileodt', str, str, str, str): (
        lambda stage_trainval, use_val, stage_test, augment:
            get_dset_intel_mobileodt(stage_trainval, use_val, stage_test, augment)),
    #  ('origa', ... todo): ( lambda ...: get_dset_origa(...)
    #  ('riga', ... todo): ( lambda ...: get_dset_riga(...)
    ('chexpert', str, str): (
        lambda frac_train, frac_val: get_dset_chexpert(
            float(frac_train), float(frac_val),
            small=False, labels='diagnostic')),
    ('chexpert_small', str, str): (
        lambda frac_train, frac_val: get_dset_chexpert(
            float(frac_train), float(frac_val),
            small=True, labels='diagnostic')),
    ('chexpert_small_ID', str, str, str): (
        lambda n_ids, frac_train, frac_val: get_dset_chexpert(
            float(frac_train), float(frac_val),
            small=True, labels='identity', num_identities=int(n_ids))),
}


def match(spec:str, dct:dict):
    """Dispatch a ':'-separated spec string through a pattern table.

    `spec` is split on ':' and handed to `pampy.match` together with the
    table's entries flattened to `pattern1, action1, pattern2, action2, ...`
    in the dict's iteration order.  Returns whatever `pampy.match` returns.
    """
    fields = spec.split(':')
    flattened = []
    for pattern, action in dct.items():
        flattened.append(pattern)
        flattened.append(action)
    return pampy.match(fields, *flattened)


def get_model_opt_loss(
        model_spec:str, opt_spec:str, loss_spec:str, regularizer_spec:str,
        device:str) -> dict[str, Union[T.nn.Module, T.optim.Optimizer]]:
    """Instantiate the model, its optimizer and the loss function.

    Args:
        model_spec: looked up in `MODELS`.  A string of form,
            "model_name:pretraining:in_channels:out_classes".  For example:
            "effnetv2:untrained:1:5"
        opt_spec: passed to `reset_optimizer` together with the model, e.g.
            "SGD:lr=.003:momentum=.9" (an optimizer name from T.optim
            followed by its numerical parameters).
        loss_spec: looked up in `LOSS_FNS`, e.g. "CrossEntropyLoss".
        regularizer_spec: 'none', or a spec understood by `RegularizedLoss`;
            anything other than 'none' wraps the loss in `RegularizedLoss`.
        device: e.g. 'cpu' or 'cuda'; the model is moved there.
    Returns:
        dict with keys 'model', 'optimizer' and 'loss_fn'.
    """
    model = match(model_spec, MODELS).to(device, non_blocking=True)
    # optimizer is created after the move so it sees the on-device parameters
    opt = reset_optimizer(opt_spec, model)
    criterion = match(loss_spec, LOSS_FNS)
    if regularizer_spec != 'none':
        criterion = RegularizedLoss(model, criterion, regularizer_spec)
    return {'model': model, 'optimizer': opt, 'loss_fn': criterion}


class RegularizedLoss(T.nn.Module):
    """Wrap a loss function and add a regularization term to its value.

    Supported `regularizer_spec` values:
        'none'          - adds 0.
        'deepfixmlp:X'  - adds float(X) * DeepFixMLP.get_VecAttn_regularizer(model).
    Any other spec raises NotImplementedError.
    """

    def __init__(self, model, lossfn, regularizer_spec:str):
        super().__init__()
        self.lossfn = lossfn
        self.regularizer_spec = regularizer_spec
        self.regularizer = self._make_regularizer(model, regularizer_spec)

    @staticmethod
    def _make_regularizer(model, spec):
        """Return a callable `(yhat, y) -> penalty` for the given spec."""
        if spec == 'none':
            def no_penalty(*_):
                return 0
            return no_penalty
        if spec.startswith('deepfixmlp:'):
            # the weight is parsed eagerly so a malformed spec fails here
            weight = float(spec.split(':')[1])

            def vecattn_penalty(*_):
                return weight * DeepFixMLP.get_VecAttn_regularizer(model)
            return vecattn_penalty
        raise NotImplementedError(spec)

    def forward(self, yhat, y):
        """Base loss plus the regularization penalty."""
        base = self.lossfn(yhat, y)
        penalty = self.regularizer(yhat, y)
        return base + penalty

    def __repr__(self):
        return f'RegularizedLoss<{repr(self.lossfn)},{self.regularizer_spec}>'


def get_dset_loaders_resultfactory(dset_spec:str) -> dict:
    """Create datasets and loaders for `dset_spec` and attach a result factory.

    The dict produced by the matching `DSETS` entry gets an extra key
    'result_factory': a zero-argument callable building a fresh results
    accumulator for the dataset.

    - "intel_mobileodt:" and "chexpert_small_ID:" specs use multi-class
      results (prediction = argmax of the softmax).
    - "chexpert:" and "chexpert_small:" specs use multi-label binary results
      (prediction = sigmoid > .5).

    Raises:
        NotImplementedError: for any other dataset spec.
    """
    dct, class_names = match(dset_spec, DSETS)
    multiclass_prefixes = ('intel_mobileodt:', 'chexpert_small_ID:')
    multilabel_prefixes = ('chexpert:', 'chexpert_small:')

    if dset_spec.startswith(multiclass_prefixes):
        #  dct['result_factory'] = lambda: TL.MultiLabelBinaryClassification(
                #  class_names, binarize_fn=lambda yh: (T.sigmoid(yh)>.5).long())
        def result_factory():
            return TL.MultiClassClassification(
                len(class_names), binarize_fn=lambda yh: yh.softmax(1).argmax(1))
    elif dset_spec.startswith(multilabel_prefixes):
        def result_factory():
            return CheXpertMultiLabelBinaryClassification(
                class_names, binarize_fn=lambda yh: (yh.sigmoid()>.5).long(),
                report_avg=True)
    else:
        raise NotImplementedError(f"I don't know how to create the result factory for {dset_spec}")

    dct['result_factory'] = result_factory
    return dct

class CheXpertMultiLabelBinaryClassification(TL.MultiLabelBinaryClassification):
    """Multi-label results that skip entries labelled 2 ("uncertain")."""

    def update(self, yhat, y, loss) -> None:
        """Accumulate one minibatch into the running loss and confusion matrices.

        For each class column, only the rows whose label is not 2 contribute
        to that class's 2x2 confusion matrix.
        """
        self.num_samples += yhat.shape[0]
        self.loss += loss.item()
        assert yhat.shape == y.shape
        assert yhat.ndim == 2 and yhat.shape[1] == len(self._cms), "sanity check: model outputs expected prediction shape"
        predictions = self._binarize_fn(yhat)
        assert predictions.dtype == T.long, 'sanity check binarize fn'
        assert predictions.shape == y.shape, 'sanity check binarize fn'

        certain = y.ne(2)  # True where the label is not an uncertainty label
        for column, cm in enumerate(self._cms.values()):
            usable_rows = certain[:, column]
            if not usable_rows.any():
                # nothing usable for this class in this minibatch
                continue
            batch_cm = metrics.confusion_matrix(
                y[usable_rows, column], predictions[usable_rows, column],
                num_classes=2)
            cm += batch_cm.cpu()


def get_deepfix_train_strategy(args:'TrainOptions'):
    """Translate `args.deepfix` into the callable used to train one epoch.

    Recognized specs:
        'off'                  -> plain `TL.train_one_epoch`
        'reinit:N:P:R'         -> `dfs.DeepFix_TrainOneEpoch(int(N), float(P), int(R), ...)`
        'dhist:<path>'         -> `dfs.DeepFix_DHist(path)`
        'dfhist:<path>'        -> `dfs.DeepFix_DHist(path, fixed=True)`
        'fixed'                -> `dfs.DeepFix_DHist('', fixed=True, init_with_hist=False)`
        'beta:A:B'             -> init via `init_from_beta(model, float(A), float(B))`
        'ghaarconv2d:l1,l2'    -> convert conv layers via
                                  `convert_conv2d_to_gHaarConv2d`, ignoring
                                  the listed layers

    Raises:
        NotImplementedError: for any other spec.
        AssertionError: if a histogram file path does not exist.
    """
    spec = args.deepfix

    if spec == 'off':
        return TL.train_one_epoch

    if spec.startswith('reinit:'):
        _, n, p, r = spec.split(':')
        return dfs.DeepFix_TrainOneEpoch(int(n), float(p), int(r), TL.train_one_epoch)

    if spec.startswith('dhist:'):
        # split only once: the path itself may contain ':'
        hist_path = spec.split(':', 1)[1]
        assert exists(hist_path), f'histogram file not found: {hist_path}'
        return dfs.DeepFix_DHist(hist_path)

    if spec.startswith('dfhist:'):
        hist_path = spec.split(':', 1)[1]
        assert exists(hist_path), f'histogram file not found: {hist_path}'
        return dfs.DeepFix_DHist(hist_path, fixed=True)

    if spec == 'fixed':
        return dfs.DeepFix_DHist('', fixed=True, init_with_hist=False)

    if spec.startswith('beta:'):
        alpha, beta = spec.split(':')[1:]

        def _init_beta(cfg):
            return init_from_beta(cfg.model, float(alpha), float(beta))
        return dfs.DeepFix_LambdaInit(_init_beta)

    if spec.startswith('ghaarconv2d:'):
        ignore_layers = spec.split(':')[1].split(',')

        def _init_ghaar(cfg):
            print(f'initialize {spec}')
            converted = convert_conv2d_to_gHaarConv2d(
                cfg.model, ignore_layers=ignore_layers)
            # NOTE(review): the optimizer returned here is not stored on
            # `cfg`; unless DeepFix_LambdaInit consumes this return value,
            # training may continue with the old optimizer - confirm.
            new_optimizer = reset_optimizer(args.opt, cfg.model)
            print(cfg.model)
            return (None, converted, new_optimizer, None)
        return dfs.DeepFix_LambdaInit(_init_ghaar)

    raise NotImplementedError(spec)


def train_config(args:'TrainOptions') -> TL.TrainConfig:
    """Assemble a `TL.TrainConfig` from parsed `TrainOptions`.

    Builds, in this order: model/optimizer/loss, datasets/loaders/result
    factory, and the per-epoch training strategy; then combines them with the
    scalar options (device, epochs, start_epoch, experiment_id).
    """
    model_parts = get_model_opt_loss(
        args.model, args.opt, args.lossfn, args.loss_reg, args.device)
    data_parts = get_dset_loaders_resultfactory(args.dset)
    epoch_fn = get_deepfix_train_strategy(args)
    return TL.TrainConfig(
        **model_parts,
        **data_parts,
        device=args.device,
        epochs=args.epochs,
        start_epoch=args.start_epoch,
        train_one_epoch=epoch_fn,
        experiment_id=args.experiment_id,
    )


# NOTE(review): this dataclass is registered with simple_parsing's
# ArgumentParser in `main`, so each field becomes a command-line option.
# simple_parsing appears to use the class docstring and the comments next to
# each field as --help text - confirm before rewording them.  The class
# docstring mentions only IntelMobileODTCervical, although the commented
# choices for `dset` below also list CheXpert specs.
@dc.dataclass
class TrainOptions:
    """High-level configuration for training PyTorch models
    on the IntelMobileODTCervical dataset.
    """
    epochs:int = 50
    start_epoch:int = 0  # if "--start_epoch 1", then don't evaluate perf before training.
    device:str = 'cuda' if T.cuda.is_available() else 'cpu'
    dset:str = None #choice(
        #  'intel_mobileodt:train:val:test:v1',
        #  'intel_mobileodt:train+additional:val:test:v1',
        #  'intel_mobileodt:train+additional:noval:test:v1',
        #  'chexpert:.8:.2', 'chexpert:.01:.01', 'chexpert:.001:.001',
        #  'chexpert_small:.8:.2', 'chexpert_small:.01:.01',
        #   'chexpert_small:.001:.001',
        #  default='intel_mobileodt:train:val:test:v1')
    opt:str = 'SGD:lr=.001:momentum=.9:nesterov=1'
    lossfn:str = None  # choices:
        #  'BCEWithLogitsLoss',
        #  'CrossEntropyLoss', 
        #  'CE_intelmobileodt',
        #  'chexpert_uignore', 
        #  'chexpert_identity:N' for some N=num_identities predicted by model (compared to identities y%N)
    loss_reg:str = 'none'  # Optionally add a regularizer to the loss.  loss + reg.  Accepted values:  'none', 'deepfixmlp:X' where X is a positive float denoting the lambda in l1 regularizer
    model:str = 'resnet18:imagenet:3:3'  # Model specification adheres to the template "model_name:pretraining:in_ch:out_ch"
    deepfix:str = 'off'  # DeepFix Re-initialization Method.
                         #  "off" or "reinit:N:P:R" or "d[f]hist:path_to_histogram.pth"
                         #  or "beta:A:B" for A,B as (float) parameters of the beta distribution
                         # 'ghaarconv2d:layer1,layer2' Replaces all spatial convolutions with GHaarConv2d layer except the specified layers
    experiment_id:str = os.environ.get('run_id', 'debugging')
    prune:str = 'off'

    def execute(self) -> None:
        """Build the training configuration from these options and train."""
        cfg = train_config(self)
        cfg.train(cfg)


def main(argv=None):
    """Parse training options, build the training config and train.

    Args:
        argv: optional list of command-line style arguments for
            `TrainOptions`, e.g. ["--dset", "chexpert_small:.01:.01", ...].
            When None (the default), the built-in experiment below is run:
            efficientnet-b1 (imagenet weights, 1 input channel, 14 outputs)
            on `chexpert_small:.01:.01` with Adam and the `chexpert_uignore`
            loss.  The defaults are hard-coded rather than read from
            `sys.argv` so that the function can be called from a notebook.

    Raises:
        AssertionError: if `--prune` is not 'off' and does not start with
            'ChannelPrune:'.
        NotImplementedError: if `--prune` is anything other than 'off'.
    """
    p = ArgumentParser()
    p.add_arguments(TrainOptions, dest='TrainOptions')

    if argv is None:
        in_ch, out_ch = 1, 14
        model_params = f"efficientnet-b1:imagenet:{in_ch}:{out_ch}"
        # A wavelet MLP sweep can be run instead by passing `argv` with e.g.
        #   --model waveletmlp:300:1:14:<wavelet_levels>:<patch_size>:1:2
        exp_id = f'model_{model_params}_in_ch_{in_ch}out_ch_{out_ch}'
        argv = [
            "--dset", "chexpert_small:.01:.01",
            "--opt", "Adam:lr=0.001",
            "--lossfn", "chexpert_uignore",
            "--model", model_params,
            "--loss_reg", "none",
            "--experiment_id", exp_id,
        ]
    args = p.parse_args(list(argv)).TrainOptions

    print(args)

    # Equivalent command line of an earlier experiment:
    # python deepfix/train.py --dset chexpert_small:.01:.01 --opt Adam:lr=0.001 --lossfn chexpert_uignore --model waveletmlp:300:1:14:7:1:1:2 --loss_reg none

    if args.prune != 'off':
        # Checked before the (expensive) config is built so that an
        # unsupported option fails fast.
        assert args.prune.startswith('ChannelPrune:')
        # The disabled implementation called
        #   explainfix.channelprune(cfg.model, pct=5,
        #       grad_cost_fn=deepfix.weight_saliency.costfn_multiclass,
        #       loader=cfg.train_loader, device=cfg.device, num_minibatches=10)
        # and asserted that the model's parameter count changed.
        raise NotImplementedError('code is a bit hardcoded, so it is not available without hacking on it.')

    cfg = train_config(args)
    cfg.train(cfg)

    print('+++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++')
    #  import IPython ; IPython.embed() ; import sys ; sys.exit()

    # To profile training, wrap `cfg.train(cfg)` in
    #  with T.profiler.profile(
    #      activities=[
    #          T.profiler.ProfilerActivity.CPU,
    #          T.profiler.ProfilerActivity.CUDA,
    #      ], with_modules=True,
    #  ) as p:
    #      cfg.train(cfg)
    #  print(p.key_averages().table(
    #      sort_by="self_cuda_time_total", row_limit=-1))


if __name__ == "__main__":
    main()


TrainOptions(epochs=50, start_epoch=0, device='cuda', dset='chexpert_small:.01:.01', opt='Adam:lr=0.001', lossfn='chexpert_uignore', loss_reg='none', model='efficientnet-b1:imagenet:1:14', deepfix='off', experiment_id='model_efficientnet-b1:imagenet:1:14_in_ch_1out_ch_14', prune='off')
Loaded pretrained weights for efficientnet-b1
Checkpoint ./results/model_efficientnet-b1:imagenet:1:14_in_ch_1out_ch_14/checkpoints/epoch_0.pth


100%|██████████| 149/149 [00:45<00:00,  3.25it/s]
100%|██████████| 149/149 [00:51<00:00,  2.87it/s]
100%|██████████| 16/16 [00:06<00:00,  2.50it/s]
INFO:simplepytorch.logging_tools:DataLogger writing to file: /ocean/projects/cie160013p/elvinj/DeepFix/deepfix/results/model_efficientnet-b1:imagenet:1:14_in_ch_1out_ch_14/log/20220130T044647.339098_perf.csv


[1m[32mepoch[0m:    0, [1m[32mseconds_training_epoch[0m: nan
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  101.47194, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.03497, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.04352, [1m[36mtrain_MCC Cardiomegaly[0m:  nan, [1m[36mtrain_MCC Lung Opacity[0m:  nan, [1m[36mtrain_MCC Lung Lesion[0m:  0.05939, [1m[36mtrain_MCC Edema[0m:  0.09511, [1m[36mtrain_MCC Consolidation[0m: -0.04160, [1m[36mtrain_MCC Pneumonia[0m:  0.00423, [1m[36mtrain_MCC Atelectasis[0m: -0.03738, [1m[36mtrain_MCC Pneumothorax[0m:  nan, [1m[36mtrain_MCC Pleural Effusion[0m:  0.01044, [1m[36mtrain_MCC Pleural Other[0m:  0.06170, [1m[36mtrain_MCC Fracture[0m:  0.01069, [1m[36mtrain_MCC Support Devices[0m: -0.02889, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.22222, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.05666, [1m[36mtrain_Prec

100%|██████████| 149/149 [01:12<00:00,  2.07it/s]
100%|██████████| 149/149 [00:38<00:00,  3.88it/s]
100%|██████████| 16/16 [00:05<00:00,  3.12it/s]


[1m[32mepoch[0m:    1, [1m[32mseconds_training_epoch[0m: 72.1138
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  55.33206, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m: -0.00675, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m: -0.01610, [1m[36mtrain_MCC Cardiomegaly[0m:  0.00657, [1m[36mtrain_MCC Lung Opacity[0m:  0.13877, [1m[36mtrain_MCC Lung Lesion[0m: -0.00596, [1m[36mtrain_MCC Edema[0m:  0.15896, [1m[36mtrain_MCC Consolidation[0m: -0.01964, [1m[36mtrain_MCC Pneumonia[0m:  0.02684, [1m[36mtrain_MCC Atelectasis[0m: -0.03107, [1m[36mtrain_MCC Pneumothorax[0m: -0.01773, [1m[36mtrain_MCC Pleural Effusion[0m:  0.19929, [1m[36mtrain_MCC Pleural Other[0m:  0.03606, [1m[36mtrain_MCC Fracture[0m: -0.01429, [1m[36mtrain_MCC Support Devices[0m:  0.21675, [1m[36mtrain_MCC AVG[0m:  0.04798, [1m[36mtrain_Precision No Finding[0m:  0.07692, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, 

100%|██████████| 149/149 [01:03<00:00,  2.36it/s]
100%|██████████| 149/149 [00:39<00:00,  3.82it/s]
100%|██████████| 16/16 [00:05<00:00,  3.09it/s]


[1m[32mepoch[0m:    2, [1m[32mseconds_training_epoch[0m: 63.0716
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  51.55201, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.02085, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.02296, [1m[36mtrain_MCC Lung Opacity[0m:  0.23288, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.20658, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  nan, [1m[36mtrain_MCC Pneumothorax[0m:  nan, [1m[36mtrain_MCC Pleural Effusion[0m:  0.35529, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.29213, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.17647, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Cardiomegal

100%|██████████| 149/149 [01:01<00:00,  2.42it/s]
100%|██████████| 149/149 [00:40<00:00,  3.71it/s]
100%|██████████| 16/16 [00:05<00:00,  3.04it/s]


[1m[32mepoch[0m:    3, [1m[32mseconds_training_epoch[0m: 61.6557
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  49.74460, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.13746, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.04698, [1m[36mtrain_MCC Lung Opacity[0m:  0.24617, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.28692, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m: -0.01033, [1m[36mtrain_MCC Pneumothorax[0m:  nan, [1m[36mtrain_MCC Pleural Effusion[0m:  0.41788, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.34025, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.44118, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Cardiom

100%|██████████| 149/149 [01:00<00:00,  2.46it/s]
100%|██████████| 149/149 [00:42<00:00,  3.53it/s]
100%|██████████| 16/16 [00:05<00:00,  3.15it/s]


[1m[32mepoch[0m:    4, [1m[32mseconds_training_epoch[0m: 60.6485
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  48.49139, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.21689, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.17932, [1m[36mtrain_MCC Lung Opacity[0m:  0.26056, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.27671, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.02926, [1m[36mtrain_MCC Pneumothorax[0m:  nan, [1m[36mtrain_MCC Pleural Effusion[0m:  0.46095, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.40145, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.52830, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Cardiom

100%|██████████| 149/149 [00:59<00:00,  2.50it/s]
100%|██████████| 149/149 [00:42<00:00,  3.47it/s]
100%|██████████| 16/16 [00:05<00:00,  3.04it/s]


[1m[32mepoch[0m:    5, [1m[32mseconds_training_epoch[0m: 59.6059
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  46.52825, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.33610, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.24992, [1m[36mtrain_MCC Lung Opacity[0m:  0.30519, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.35447, [1m[36mtrain_MCC Consolidation[0m:  nan, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.02624, [1m[36mtrain_MCC Pneumothorax[0m:  0.09685, [1m[36mtrain_MCC Pleural Effusion[0m:  0.47195, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.44402, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.61628, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision Car

100%|██████████| 149/149 [00:58<00:00,  2.55it/s]
100%|██████████| 149/149 [00:42<00:00,  3.49it/s]
100%|██████████| 16/16 [00:05<00:00,  3.13it/s]


[1m[32mepoch[0m:    6, [1m[32mseconds_training_epoch[0m: 58.4428
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  44.69687, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.32621, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.32927, [1m[36mtrain_MCC Lung Opacity[0m:  0.33461, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.45840, [1m[36mtrain_MCC Consolidation[0m: -0.00924, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.05376, [1m[36mtrain_MCC Pneumothorax[0m:  0.12770, [1m[36mtrain_MCC Pleural Effusion[0m:  0.53619, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.50431, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.55882, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision

100%|██████████| 149/149 [00:55<00:00,  2.67it/s]
100%|██████████| 149/149 [00:40<00:00,  3.70it/s]
100%|██████████| 16/16 [00:04<00:00,  3.87it/s]


[1m[32mepoch[0m:    7, [1m[32mseconds_training_epoch[0m: 55.7228
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  42.67041, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.37882, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.40313, [1m[36mtrain_MCC Lung Opacity[0m:  0.34064, [1m[36mtrain_MCC Lung Lesion[0m:  nan, [1m[36mtrain_MCC Edema[0m:  0.47250, [1m[36mtrain_MCC Consolidation[0m:  0.11217, [1m[36mtrain_MCC Pneumonia[0m:  nan, [1m[36mtrain_MCC Atelectasis[0m:  0.04438, [1m[36mtrain_MCC Pneumothorax[0m:  0.18514, [1m[36mtrain_MCC Pleural Effusion[0m:  0.50968, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  nan, [1m[36mtrain_MCC Support Devices[0m:  0.51667, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.59322, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36mtrain_Precision

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:39<00:00,  3.79it/s]
100%|██████████| 16/16 [00:04<00:00,  3.88it/s]


[1m[32mepoch[0m:    8, [1m[32mseconds_training_epoch[0m: 55.5589
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  39.84921, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.54359, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.09330, [1m[36mtrain_MCC Cardiomegaly[0m:  0.44375, [1m[36mtrain_MCC Lung Opacity[0m:  0.41662, [1m[36mtrain_MCC Lung Lesion[0m: -0.00422, [1m[36mtrain_MCC Edema[0m:  0.53461, [1m[36mtrain_MCC Consolidation[0m:  0.19694, [1m[36mtrain_MCC Pneumonia[0m:  0.06107, [1m[36mtrain_MCC Atelectasis[0m:  0.12637, [1m[36mtrain_MCC Pneumothorax[0m:  0.40831, [1m[36mtrain_MCC Pleural Effusion[0m:  0.60300, [1m[36mtrain_MCC Pleural Other[0m:  nan, [1m[36mtrain_MCC Fracture[0m:  0.10450, [1m[36mtrain_MCC Support Devices[0m:  0.58617, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.70701, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  1.00000, [1m[36

100%|██████████| 149/149 [00:57<00:00,  2.58it/s]
100%|██████████| 149/149 [00:37<00:00,  3.93it/s]
100%|██████████| 16/16 [00:03<00:00,  4.01it/s]


[1m[32mepoch[0m:    9, [1m[32mseconds_training_epoch[0m: 57.7285
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  37.38031, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.54846, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  nan, [1m[36mtrain_MCC Cardiomegaly[0m:  0.55603, [1m[36mtrain_MCC Lung Opacity[0m:  0.42623, [1m[36mtrain_MCC Lung Lesion[0m:  0.07273, [1m[36mtrain_MCC Edema[0m:  0.58765, [1m[36mtrain_MCC Consolidation[0m:  0.13395, [1m[36mtrain_MCC Pneumonia[0m: -0.00423, [1m[36mtrain_MCC Atelectasis[0m:  0.21199, [1m[36mtrain_MCC Pneumothorax[0m:  0.42131, [1m[36mtrain_MCC Pleural Effusion[0m:  0.65891, [1m[36mtrain_MCC Pleural Other[0m: -0.00394, [1m[36mtrain_MCC Fracture[0m:  0.05539, [1m[36mtrain_MCC Support Devices[0m:  0.63210, [1m[36mtrain_MCC AVG[0m:  nan, [1m[36mtrain_Precision No Finding[0m:  0.70625, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.00000, [1m[36

100%|██████████| 149/149 [00:58<00:00,  2.56it/s]
100%|██████████| 149/149 [00:36<00:00,  4.06it/s]
100%|██████████| 16/16 [00:03<00:00,  4.03it/s]


[1m[32mepoch[0m:   10, [1m[32mseconds_training_epoch[0m: 58.2201
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  33.44237, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.62485, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.08828, [1m[36mtrain_MCC Cardiomegaly[0m:  0.63686, [1m[36mtrain_MCC Lung Opacity[0m:  0.46425, [1m[36mtrain_MCC Lung Lesion[0m:  0.18772, [1m[36mtrain_MCC Edema[0m:  0.65735, [1m[36mtrain_MCC Consolidation[0m:  0.34447, [1m[36mtrain_MCC Pneumonia[0m:  0.21176, [1m[36mtrain_MCC Atelectasis[0m:  0.29685, [1m[36mtrain_MCC Pneumothorax[0m:  0.51524, [1m[36mtrain_MCC Pleural Effusion[0m:  0.68689, [1m[36mtrain_MCC Pleural Other[0m:  0.24335, [1m[36mtrain_MCC Fracture[0m:  0.25625, [1m[36mtrain_MCC Support Devices[0m:  0.68990, [1m[36mtrain_MCC AVG[0m:  0.42172, [1m[36mtrain_Precision No Finding[0m:  0.75568, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.50000, 

100%|██████████| 149/149 [00:59<00:00,  2.52it/s]
100%|██████████| 149/149 [00:35<00:00,  4.20it/s]
100%|██████████| 16/16 [00:04<00:00,  3.93it/s]


[1m[32mepoch[0m:   11, [1m[32mseconds_training_epoch[0m: 59.113
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  30.64868, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.73714, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.23512, [1m[36mtrain_MCC Cardiomegaly[0m:  0.65322, [1m[36mtrain_MCC Lung Opacity[0m:  0.51428, [1m[36mtrain_MCC Lung Lesion[0m:  0.14565, [1m[36mtrain_MCC Edema[0m:  0.69115, [1m[36mtrain_MCC Consolidation[0m:  0.43511, [1m[36mtrain_MCC Pneumonia[0m:  0.35169, [1m[36mtrain_MCC Atelectasis[0m:  0.39303, [1m[36mtrain_MCC Pneumothorax[0m:  0.63344, [1m[36mtrain_MCC Pleural Effusion[0m:  0.70112, [1m[36mtrain_MCC Pleural Other[0m:  0.18092, [1m[36mtrain_MCC Fracture[0m:  0.36179, [1m[36mtrain_MCC Support Devices[0m:  0.72716, [1m[36mtrain_MCC AVG[0m:  0.48292, [1m[36mtrain_Precision No Finding[0m:  0.80383, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.66667, 

100%|██████████| 149/149 [01:01<00:00,  2.44it/s]
100%|██████████| 149/149 [00:34<00:00,  4.35it/s]
100%|██████████| 16/16 [00:04<00:00,  3.83it/s]


[1m[32mepoch[0m:   12, [1m[32mseconds_training_epoch[0m: 61.0999
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  27.32686, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.69408, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.25703, [1m[36mtrain_MCC Cardiomegaly[0m:  0.73364, [1m[36mtrain_MCC Lung Opacity[0m:  0.56462, [1m[36mtrain_MCC Lung Lesion[0m:  0.31473, [1m[36mtrain_MCC Edema[0m:  0.72079, [1m[36mtrain_MCC Consolidation[0m:  0.49386, [1m[36mtrain_MCC Pneumonia[0m:  0.28204, [1m[36mtrain_MCC Atelectasis[0m:  0.50850, [1m[36mtrain_MCC Pneumothorax[0m:  0.68771, [1m[36mtrain_MCC Pleural Effusion[0m:  0.78532, [1m[36mtrain_MCC Pleural Other[0m:  0.30645, [1m[36mtrain_MCC Fracture[0m:  0.45290, [1m[36mtrain_MCC Support Devices[0m:  0.74668, [1m[36mtrain_MCC AVG[0m:  0.53917, [1m[36mtrain_Precision No Finding[0m:  0.80645, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.61905, 

100%|██████████| 149/149 [01:01<00:00,  2.41it/s]
100%|██████████| 149/149 [00:33<00:00,  4.45it/s]
100%|██████████| 16/16 [00:04<00:00,  3.78it/s]


[1m[32mepoch[0m:   13, [1m[32mseconds_training_epoch[0m: 61.9429
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  22.78691, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.80219, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.40605, [1m[36mtrain_MCC Cardiomegaly[0m:  0.79030, [1m[36mtrain_MCC Lung Opacity[0m:  0.60009, [1m[36mtrain_MCC Lung Lesion[0m:  0.50896, [1m[36mtrain_MCC Edema[0m:  0.80548, [1m[36mtrain_MCC Consolidation[0m:  0.62606, [1m[36mtrain_MCC Pneumonia[0m:  0.48626, [1m[36mtrain_MCC Atelectasis[0m:  0.55678, [1m[36mtrain_MCC Pneumothorax[0m:  0.79091, [1m[36mtrain_MCC Pleural Effusion[0m:  0.80983, [1m[36mtrain_MCC Pleural Other[0m:  0.43253, [1m[36mtrain_MCC Fracture[0m:  0.67405, [1m[36mtrain_MCC Support Devices[0m:  0.80529, [1m[36mtrain_MCC AVG[0m:  0.64963, [1m[36mtrain_Precision No Finding[0m:  0.85185, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.80000, 

100%|██████████| 149/149 [01:02<00:00,  2.38it/s]
100%|██████████| 149/149 [00:33<00:00,  4.45it/s]
100%|██████████| 16/16 [00:04<00:00,  3.38it/s]


[1m[32mepoch[0m:   14, [1m[32mseconds_training_epoch[0m: 62.5491
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  19.14942, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.83966, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.53429, [1m[36mtrain_MCC Cardiomegaly[0m:  0.82583, [1m[36mtrain_MCC Lung Opacity[0m:  0.70472, [1m[36mtrain_MCC Lung Lesion[0m:  0.55779, [1m[36mtrain_MCC Edema[0m:  0.82832, [1m[36mtrain_MCC Consolidation[0m:  0.77387, [1m[36mtrain_MCC Pneumonia[0m:  0.58283, [1m[36mtrain_MCC Atelectasis[0m:  0.65842, [1m[36mtrain_MCC Pneumothorax[0m:  0.79532, [1m[36mtrain_MCC Pleural Effusion[0m:  0.84462, [1m[36mtrain_MCC Pleural Other[0m:  0.52963, [1m[36mtrain_MCC Fracture[0m:  0.65548, [1m[36mtrain_MCC Support Devices[0m:  0.83879, [1m[36mtrain_MCC AVG[0m:  0.71211, [1m[36mtrain_Precision No Finding[0m:  0.88479, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.76786, 

100%|██████████| 149/149 [01:01<00:00,  2.43it/s]
100%|██████████| 149/149 [00:34<00:00,  4.30it/s]
100%|██████████| 16/16 [00:04<00:00,  3.32it/s]


[1m[32mepoch[0m:   15, [1m[32mseconds_training_epoch[0m: 61.3
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  16.24847, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.87468, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.51811, [1m[36mtrain_MCC Cardiomegaly[0m:  0.84842, [1m[36mtrain_MCC Lung Opacity[0m:  0.74969, [1m[36mtrain_MCC Lung Lesion[0m:  0.63141, [1m[36mtrain_MCC Edema[0m:  0.87547, [1m[36mtrain_MCC Consolidation[0m:  0.77462, [1m[36mtrain_MCC Pneumonia[0m:  0.66936, [1m[36mtrain_MCC Atelectasis[0m:  0.73441, [1m[36mtrain_MCC Pneumothorax[0m:  0.84760, [1m[36mtrain_MCC Pleural Effusion[0m:  0.85416, [1m[36mtrain_MCC Pleural Other[0m:  0.76895, [1m[36mtrain_MCC Fracture[0m:  0.71642, [1m[36mtrain_MCC Support Devices[0m:  0.86756, [1m[36mtrain_MCC AVG[0m:  0.76649, [1m[36mtrain_Precision No Finding[0m:  0.91324, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.75926, [1

100%|██████████| 149/149 [00:59<00:00,  2.49it/s]
100%|██████████| 149/149 [00:36<00:00,  4.12it/s]
100%|██████████| 16/16 [00:04<00:00,  3.34it/s]


[1m[32mepoch[0m:   16, [1m[32mseconds_training_epoch[0m: 59.8045
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  14.95836, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.86532, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.67883, [1m[36mtrain_MCC Cardiomegaly[0m:  0.85276, [1m[36mtrain_MCC Lung Opacity[0m:  0.79456, [1m[36mtrain_MCC Lung Lesion[0m:  0.71144, [1m[36mtrain_MCC Edema[0m:  0.87198, [1m[36mtrain_MCC Consolidation[0m:  0.77341, [1m[36mtrain_MCC Pneumonia[0m:  0.74480, [1m[36mtrain_MCC Atelectasis[0m:  0.78963, [1m[36mtrain_MCC Pneumothorax[0m:  0.85218, [1m[36mtrain_MCC Pleural Effusion[0m:  0.85207, [1m[36mtrain_MCC Pleural Other[0m:  0.68633, [1m[36mtrain_MCC Fracture[0m:  0.78389, [1m[36mtrain_MCC Support Devices[0m:  0.86748, [1m[36mtrain_MCC AVG[0m:  0.79462, [1m[36mtrain_Precision No Finding[0m:  0.87931, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.82895, 

100%|██████████| 149/149 [00:58<00:00,  2.53it/s]
100%|██████████| 149/149 [00:36<00:00,  4.08it/s]
100%|██████████| 16/16 [00:04<00:00,  3.29it/s]


[1m[32mepoch[0m:   17, [1m[32mseconds_training_epoch[0m: 58.8239
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  12.36943, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.87278, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.75196, [1m[36mtrain_MCC Cardiomegaly[0m:  0.87479, [1m[36mtrain_MCC Lung Opacity[0m:  0.80465, [1m[36mtrain_MCC Lung Lesion[0m:  0.78830, [1m[36mtrain_MCC Edema[0m:  0.88686, [1m[36mtrain_MCC Consolidation[0m:  0.81209, [1m[36mtrain_MCC Pneumonia[0m:  0.76652, [1m[36mtrain_MCC Atelectasis[0m:  0.85515, [1m[36mtrain_MCC Pneumothorax[0m:  0.85818, [1m[36mtrain_MCC Pleural Effusion[0m:  0.88644, [1m[36mtrain_MCC Pleural Other[0m:  0.77074, [1m[36mtrain_MCC Fracture[0m:  0.85584, [1m[36mtrain_MCC Support Devices[0m:  0.91166, [1m[36mtrain_MCC AVG[0m:  0.83543, [1m[36mtrain_Precision No Finding[0m:  0.90541, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.86905, 

100%|██████████| 149/149 [00:58<00:00,  2.57it/s]
100%|██████████| 149/149 [00:37<00:00,  3.93it/s]
100%|██████████| 16/16 [00:04<00:00,  3.33it/s]


[1m[32mepoch[0m:   18, [1m[32mseconds_training_epoch[0m: 58.0596
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  11.75731, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.83953, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.81477, [1m[36mtrain_MCC Cardiomegaly[0m:  0.87247, [1m[36mtrain_MCC Lung Opacity[0m:  0.84135, [1m[36mtrain_MCC Lung Lesion[0m:  0.80676, [1m[36mtrain_MCC Edema[0m:  0.88263, [1m[36mtrain_MCC Consolidation[0m:  0.80003, [1m[36mtrain_MCC Pneumonia[0m:  0.82624, [1m[36mtrain_MCC Atelectasis[0m:  0.83192, [1m[36mtrain_MCC Pneumothorax[0m:  0.86976, [1m[36mtrain_MCC Pleural Effusion[0m:  0.90022, [1m[36mtrain_MCC Pleural Other[0m:  0.85409, [1m[36mtrain_MCC Fracture[0m:  0.88319, [1m[36mtrain_MCC Support Devices[0m:  0.89811, [1m[36mtrain_MCC AVG[0m:  0.85151, [1m[36mtrain_Precision No Finding[0m:  0.86726, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.90110, 

100%|██████████| 149/149 [00:56<00:00,  2.63it/s]
100%|██████████| 149/149 [00:38<00:00,  3.84it/s]
100%|██████████| 16/16 [00:04<00:00,  3.35it/s]


[1m[32mepoch[0m:   19, [1m[32mseconds_training_epoch[0m: 56.5811
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  9.90894, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.90687, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.83096, [1m[36mtrain_MCC Cardiomegaly[0m:  0.91905, [1m[36mtrain_MCC Lung Opacity[0m:  0.87527, [1m[36mtrain_MCC Lung Lesion[0m:  0.77916, [1m[36mtrain_MCC Edema[0m:  0.92410, [1m[36mtrain_MCC Consolidation[0m:  0.85621, [1m[36mtrain_MCC Pneumonia[0m:  0.88987, [1m[36mtrain_MCC Atelectasis[0m:  0.83913, [1m[36mtrain_MCC Pneumothorax[0m:  0.88719, [1m[36mtrain_MCC Pleural Effusion[0m:  0.91886, [1m[36mtrain_MCC Pleural Other[0m:  0.88408, [1m[36mtrain_MCC Fracture[0m:  0.90812, [1m[36mtrain_MCC Support Devices[0m:  0.92260, [1m[36mtrain_MCC AVG[0m:  0.88153, [1m[36mtrain_Precision No Finding[0m:  0.94091, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.91304, 

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:39<00:00,  3.75it/s]
100%|██████████| 16/16 [00:04<00:00,  3.25it/s]


[1m[32mepoch[0m:   20, [1m[32mseconds_training_epoch[0m: 55.5177
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  9.89467, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.92079, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.90577, [1m[36mtrain_MCC Cardiomegaly[0m:  0.90576, [1m[36mtrain_MCC Lung Opacity[0m:  0.85235, [1m[36mtrain_MCC Lung Lesion[0m:  0.81532, [1m[36mtrain_MCC Edema[0m:  0.92284, [1m[36mtrain_MCC Consolidation[0m:  0.83344, [1m[36mtrain_MCC Pneumonia[0m:  0.82806, [1m[36mtrain_MCC Atelectasis[0m:  0.86022, [1m[36mtrain_MCC Pneumothorax[0m:  0.90903, [1m[36mtrain_MCC Pleural Effusion[0m:  0.90605, [1m[36mtrain_MCC Pleural Other[0m:  0.84332, [1m[36mtrain_MCC Fracture[0m:  0.96400, [1m[36mtrain_MCC Support Devices[0m:  0.88909, [1m[36mtrain_MCC AVG[0m:  0.88257, [1m[36mtrain_Precision No Finding[0m:  0.92704, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94118, 

100%|██████████| 149/149 [00:54<00:00,  2.72it/s]
100%|██████████| 149/149 [00:40<00:00,  3.70it/s]
100%|██████████| 16/16 [00:04<00:00,  3.51it/s]


[1m[32mepoch[0m:   21, [1m[32mseconds_training_epoch[0m: 54.8065
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  8.73043, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.89990, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.86584, [1m[36mtrain_MCC Cardiomegaly[0m:  0.90802, [1m[36mtrain_MCC Lung Opacity[0m:  0.89089, [1m[36mtrain_MCC Lung Lesion[0m:  0.87844, [1m[36mtrain_MCC Edema[0m:  0.91277, [1m[36mtrain_MCC Consolidation[0m:  0.91019, [1m[36mtrain_MCC Pneumonia[0m:  0.86165, [1m[36mtrain_MCC Atelectasis[0m:  0.89223, [1m[36mtrain_MCC Pneumothorax[0m:  0.93780, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93356, [1m[36mtrain_MCC Pleural Other[0m:  0.91445, [1m[36mtrain_MCC Fracture[0m:  0.93354, [1m[36mtrain_MCC Support Devices[0m:  0.93329, [1m[36mtrain_MCC AVG[0m:  0.90518, [1m[36mtrain_Precision No Finding[0m:  0.92825, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.90196, 

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:39<00:00,  3.76it/s]
100%|██████████| 16/16 [00:04<00:00,  3.99it/s]


[1m[32mepoch[0m:   22, [1m[32mseconds_training_epoch[0m: 55.638
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  7.86787, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.91567, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.87379, [1m[36mtrain_MCC Cardiomegaly[0m:  0.92483, [1m[36mtrain_MCC Lung Opacity[0m:  0.89912, [1m[36mtrain_MCC Lung Lesion[0m:  0.85040, [1m[36mtrain_MCC Edema[0m:  0.92329, [1m[36mtrain_MCC Consolidation[0m:  0.89751, [1m[36mtrain_MCC Pneumonia[0m:  0.89878, [1m[36mtrain_MCC Atelectasis[0m:  0.90566, [1m[36mtrain_MCC Pneumothorax[0m:  0.93242, [1m[36mtrain_MCC Pleural Effusion[0m:  0.92565, [1m[36mtrain_MCC Pleural Other[0m:  0.92928, [1m[36mtrain_MCC Fracture[0m:  0.89628, [1m[36mtrain_MCC Support Devices[0m:  0.91983, [1m[36mtrain_MCC AVG[0m:  0.90661, [1m[36mtrain_Precision No Finding[0m:  0.92641, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.93750, [

100%|██████████| 149/149 [00:56<00:00,  2.65it/s]
100%|██████████| 149/149 [00:38<00:00,  3.87it/s]
100%|██████████| 16/16 [00:03<00:00,  4.05it/s]


[1m[32mepoch[0m:   23, [1m[32mseconds_training_epoch[0m: 56.1255
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  7.40673, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95210, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.89473, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93372, [1m[36mtrain_MCC Lung Opacity[0m:  0.90004, [1m[36mtrain_MCC Lung Lesion[0m:  0.89012, [1m[36mtrain_MCC Edema[0m:  0.93237, [1m[36mtrain_MCC Consolidation[0m:  0.90979, [1m[36mtrain_MCC Pneumonia[0m:  0.91338, [1m[36mtrain_MCC Atelectasis[0m:  0.92038, [1m[36mtrain_MCC Pneumothorax[0m:  0.90926, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93250, [1m[36mtrain_MCC Pleural Other[0m:  0.92928, [1m[36mtrain_MCC Fracture[0m:  0.92770, [1m[36mtrain_MCC Support Devices[0m:  0.91707, [1m[36mtrain_MCC AVG[0m:  0.91875, [1m[36mtrain_Precision No Finding[0m:  0.95299, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94898, 

100%|██████████| 149/149 [00:57<00:00,  2.60it/s]
100%|██████████| 149/149 [00:37<00:00,  4.00it/s]
100%|██████████| 16/16 [00:04<00:00,  4.00it/s]


[1m[32mepoch[0m:   24, [1m[32mseconds_training_epoch[0m: 57.2591
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  6.62683, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.91436, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.89473, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93594, [1m[36mtrain_MCC Lung Opacity[0m:  0.91840, [1m[36mtrain_MCC Lung Lesion[0m:  0.92380, [1m[36mtrain_MCC Edema[0m:  0.93442, [1m[36mtrain_MCC Consolidation[0m:  0.94373, [1m[36mtrain_MCC Pneumonia[0m:  0.89809, [1m[36mtrain_MCC Atelectasis[0m:  0.94366, [1m[36mtrain_MCC Pneumothorax[0m:  0.95800, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93253, [1m[36mtrain_MCC Pleural Other[0m:  0.93044, [1m[36mtrain_MCC Fracture[0m:  0.96400, [1m[36mtrain_MCC Support Devices[0m:  0.93508, [1m[36mtrain_MCC AVG[0m:  0.93051, [1m[36mtrain_Precision No Finding[0m:  0.94570, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94898, 

100%|██████████| 149/149 [00:58<00:00,  2.54it/s]
100%|██████████| 149/149 [00:36<00:00,  4.13it/s]
100%|██████████| 16/16 [00:04<00:00,  3.97it/s]


[1m[32mepoch[0m:   25, [1m[32mseconds_training_epoch[0m: 58.5742
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  6.22304, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93937, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95579, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94090, [1m[36mtrain_MCC Lung Opacity[0m:  0.90554, [1m[36mtrain_MCC Lung Lesion[0m:  0.95611, [1m[36mtrain_MCC Edema[0m:  0.94362, [1m[36mtrain_MCC Consolidation[0m:  0.93300, [1m[36mtrain_MCC Pneumonia[0m:  0.90644, [1m[36mtrain_MCC Atelectasis[0m:  0.91432, [1m[36mtrain_MCC Pneumothorax[0m:  0.95829, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93544, [1m[36mtrain_MCC Pleural Other[0m:  0.92891, [1m[36mtrain_MCC Fracture[0m:  0.91560, [1m[36mtrain_MCC Support Devices[0m:  0.93329, [1m[36mtrain_MCC AVG[0m:  0.93333, [1m[36mtrain_Precision No Finding[0m:  0.95595, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.98077, 

100%|██████████| 149/149 [01:00<00:00,  2.48it/s]
100%|██████████| 149/149 [00:34<00:00,  4.32it/s]
100%|██████████| 16/16 [00:03<00:00,  4.06it/s]


[1m[32mepoch[0m:   26, [1m[32mseconds_training_epoch[0m: 60.182
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.62170, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94439, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93089, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94242, [1m[36mtrain_MCC Lung Opacity[0m:  0.93492, [1m[36mtrain_MCC Lung Lesion[0m:  0.95611, [1m[36mtrain_MCC Edema[0m:  0.95262, [1m[36mtrain_MCC Consolidation[0m:  0.96677, [1m[36mtrain_MCC Pneumonia[0m:  0.96449, [1m[36mtrain_MCC Atelectasis[0m:  0.92053, [1m[36mtrain_MCC Pneumothorax[0m:  0.95503, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94523, [1m[36mtrain_MCC Pleural Other[0m:  0.90258, [1m[36mtrain_MCC Fracture[0m:  0.91500, [1m[36mtrain_MCC Support Devices[0m:  0.93783, [1m[36mtrain_MCC AVG[0m:  0.94063, [1m[36mtrain_Precision No Finding[0m:  0.95633, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96117, [

100%|██████████| 149/149 [01:00<00:00,  2.45it/s]
100%|██████████| 149/149 [00:33<00:00,  4.40it/s]
100%|██████████| 16/16 [00:04<00:00,  3.82it/s]


[1m[32mepoch[0m:   27, [1m[32mseconds_training_epoch[0m: 60.863
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  6.24163, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93704, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.92659, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95122, [1m[36mtrain_MCC Lung Opacity[0m:  0.90554, [1m[36mtrain_MCC Lung Lesion[0m:  0.94965, [1m[36mtrain_MCC Edema[0m:  0.94637, [1m[36mtrain_MCC Consolidation[0m:  0.92490, [1m[36mtrain_MCC Pneumonia[0m:  0.94993, [1m[36mtrain_MCC Atelectasis[0m:  0.89411, [1m[36mtrain_MCC Pneumothorax[0m:  0.97201, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94914, [1m[36mtrain_MCC Pleural Other[0m:  0.91445, [1m[36mtrain_MCC Fracture[0m:  0.92724, [1m[36mtrain_MCC Support Devices[0m:  0.93688, [1m[36mtrain_MCC AVG[0m:  0.93465, [1m[36mtrain_Precision No Finding[0m:  0.95175, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94340, [

100%|██████████| 149/149 [01:02<00:00,  2.39it/s]
100%|██████████| 149/149 [00:33<00:00,  4.51it/s]
100%|██████████| 16/16 [00:04<00:00,  3.73it/s]


[1m[32mepoch[0m:   28, [1m[32mseconds_training_epoch[0m: 62.2561
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  6.07671, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.93704, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94082, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94257, [1m[36mtrain_MCC Lung Opacity[0m:  0.93031, [1m[36mtrain_MCC Lung Lesion[0m:  0.93092, [1m[36mtrain_MCC Edema[0m:  0.95392, [1m[36mtrain_MCC Consolidation[0m:  0.95557, [1m[36mtrain_MCC Pneumonia[0m:  0.92993, [1m[36mtrain_MCC Atelectasis[0m:  0.92629, [1m[36mtrain_MCC Pneumothorax[0m:  0.93263, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95601, [1m[36mtrain_MCC Pleural Other[0m:  0.87197, [1m[36mtrain_MCC Fracture[0m:  0.88045, [1m[36mtrain_MCC Support Devices[0m:  0.93599, [1m[36mtrain_MCC AVG[0m:  0.93032, [1m[36mtrain_Precision No Finding[0m:  0.95175, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97087, 

100%|██████████| 149/149 [01:02<00:00,  2.40it/s]
100%|██████████| 149/149 [00:33<00:00,  4.44it/s]
100%|██████████| 16/16 [00:04<00:00,  3.36it/s]


[1m[32mepoch[0m:   29, [1m[32mseconds_training_epoch[0m: 62.0958
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.76025, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94422, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93060, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94494, [1m[36mtrain_MCC Lung Opacity[0m:  0.91565, [1m[36mtrain_MCC Lung Lesion[0m:  0.91833, [1m[36mtrain_MCC Edema[0m:  0.94499, [1m[36mtrain_MCC Consolidation[0m:  0.95522, [1m[36mtrain_MCC Pneumonia[0m:  0.94257, [1m[36mtrain_MCC Atelectasis[0m:  0.95540, [1m[36mtrain_MCC Pneumothorax[0m:  0.93049, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95503, [1m[36mtrain_MCC Pleural Other[0m:  0.92928, [1m[36mtrain_MCC Fracture[0m:  0.93980, [1m[36mtrain_MCC Support Devices[0m:  0.93238, [1m[36mtrain_MCC AVG[0m:  0.93849, [1m[36mtrain_Precision No Finding[0m:  0.96035, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97030, 

100%|██████████| 149/149 [01:00<00:00,  2.44it/s]
100%|██████████| 149/149 [00:34<00:00,  4.26it/s]
100%|██████████| 16/16 [00:04<00:00,  3.37it/s]


[1m[32mepoch[0m:   30, [1m[32mseconds_training_epoch[0m: 60.957
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.80217, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94658, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94082, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93334, [1m[36mtrain_MCC Lung Opacity[0m:  0.92756, [1m[36mtrain_MCC Lung Lesion[0m:  0.93698, [1m[36mtrain_MCC Edema[0m:  0.94619, [1m[36mtrain_MCC Consolidation[0m:  0.92984, [1m[36mtrain_MCC Pneumonia[0m:  0.90644, [1m[36mtrain_MCC Atelectasis[0m:  0.94802, [1m[36mtrain_MCC Pneumothorax[0m:  0.91309, [1m[36mtrain_MCC Pleural Effusion[0m:  0.94718, [1m[36mtrain_MCC Pleural Other[0m:  0.90258, [1m[36mtrain_MCC Fracture[0m:  0.97060, [1m[36mtrain_MCC Support Devices[0m:  0.92336, [1m[36mtrain_MCC AVG[0m:  0.93376, [1m[36mtrain_Precision No Finding[0m:  0.96460, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97087, [

100%|██████████| 149/149 [00:59<00:00,  2.49it/s]
100%|██████████| 149/149 [00:36<00:00,  4.12it/s]
100%|██████████| 16/16 [00:04<00:00,  3.29it/s]


[1m[32mepoch[0m:   31, [1m[32mseconds_training_epoch[0m: 59.8879
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.36340, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95173, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93127, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95122, [1m[36mtrain_MCC Lung Opacity[0m:  0.93764, [1m[36mtrain_MCC Lung Lesion[0m:  0.85537, [1m[36mtrain_MCC Edema[0m:  0.94755, [1m[36mtrain_MCC Consolidation[0m:  0.96697, [1m[36mtrain_MCC Pneumonia[0m:  0.97170, [1m[36mtrain_MCC Atelectasis[0m:  0.90566, [1m[36mtrain_MCC Pneumothorax[0m:  0.95829, [1m[36mtrain_MCC Pleural Effusion[0m:  0.93935, [1m[36mtrain_MCC Pleural Other[0m:  0.91445, [1m[36mtrain_MCC Fracture[0m:  0.92197, [1m[36mtrain_MCC Support Devices[0m:  0.95674, [1m[36mtrain_MCC AVG[0m:  0.93642, [1m[36mtrain_Precision No Finding[0m:  0.96087, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95238, 

100%|██████████| 149/149 [00:58<00:00,  2.55it/s]
100%|██████████| 149/149 [00:37<00:00,  4.01it/s]
100%|██████████| 16/16 [00:04<00:00,  3.35it/s]


[1m[32mepoch[0m:   32, [1m[32mseconds_training_epoch[0m: 58.3984
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.89553, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96386, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.88045, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95741, [1m[36mtrain_MCC Lung Opacity[0m:  0.93672, [1m[36mtrain_MCC Lung Lesion[0m:  0.93643, [1m[36mtrain_MCC Edema[0m:  0.95771, [1m[36mtrain_MCC Consolidation[0m:  0.95918, [1m[36mtrain_MCC Pneumonia[0m:  0.91405, [1m[36mtrain_MCC Atelectasis[0m:  0.94373, [1m[36mtrain_MCC Pneumothorax[0m:  0.94938, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96778, [1m[36mtrain_MCC Pleural Other[0m:  0.94390, [1m[36mtrain_MCC Fracture[0m:  0.97028, [1m[36mtrain_MCC Support Devices[0m:  0.93509, [1m[36mtrain_MCC AVG[0m:  0.94400, [1m[36mtrain_Precision No Finding[0m:  0.96970, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.92079, 

100%|██████████| 149/149 [00:56<00:00,  2.62it/s]
100%|██████████| 149/149 [00:38<00:00,  3.87it/s]
100%|██████████| 16/16 [00:04<00:00,  3.29it/s]


[1m[32mepoch[0m:   33, [1m[32mseconds_training_epoch[0m: 56.9745
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.31193, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94439, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.90634, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95315, [1m[36mtrain_MCC Lung Opacity[0m:  0.92572, [1m[36mtrain_MCC Lung Lesion[0m:  0.97525, [1m[36mtrain_MCC Edema[0m:  0.95251, [1m[36mtrain_MCC Consolidation[0m:  0.92128, [1m[36mtrain_MCC Pneumonia[0m:  0.96442, [1m[36mtrain_MCC Atelectasis[0m:  0.94960, [1m[36mtrain_MCC Pneumothorax[0m:  0.94717, [1m[36mtrain_MCC Pleural Effusion[0m:  0.92376, [1m[36mtrain_MCC Pleural Other[0m:  0.94390, [1m[36mtrain_MCC Fracture[0m:  0.97615, [1m[36mtrain_MCC Support Devices[0m:  0.95944, [1m[36mtrain_MCC AVG[0m:  0.94593, [1m[36mtrain_Precision No Finding[0m:  0.95633, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.93269, 

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:39<00:00,  3.76it/s]
100%|██████████| 16/16 [00:04<00:00,  3.33it/s]


[1m[32mepoch[0m:   34, [1m[32mseconds_training_epoch[0m: 55.6425
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.18274, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96858, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95096, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95357, [1m[36mtrain_MCC Lung Opacity[0m:  0.94039, [1m[36mtrain_MCC Lung Lesion[0m:  0.96926, [1m[36mtrain_MCC Edema[0m:  0.97575, [1m[36mtrain_MCC Consolidation[0m:  0.95903, [1m[36mtrain_MCC Pneumonia[0m:  0.94394, [1m[36mtrain_MCC Atelectasis[0m:  0.92629, [1m[36mtrain_MCC Pneumothorax[0m:  0.95526, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95409, [1m[36mtrain_MCC Pleural Other[0m:  0.98617, [1m[36mtrain_MCC Fracture[0m:  0.97004, [1m[36mtrain_MCC Support Devices[0m:  0.97207, [1m[36mtrain_MCC AVG[0m:  0.95896, [1m[36mtrain_Precision No Finding[0m:  0.97817, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97143, 

100%|██████████| 149/149 [00:54<00:00,  2.72it/s]
100%|██████████| 149/149 [00:40<00:00,  3.72it/s]
100%|██████████| 16/16 [00:04<00:00,  3.26it/s]


[1m[32mepoch[0m:   35, [1m[32mseconds_training_epoch[0m: 54.7375
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.23294, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94422, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94082, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94071, [1m[36mtrain_MCC Lung Opacity[0m:  0.94497, [1m[36mtrain_MCC Lung Lesion[0m:  0.92380, [1m[36mtrain_MCC Edema[0m:  0.93369, [1m[36mtrain_MCC Consolidation[0m:  0.92881, [1m[36mtrain_MCC Pneumonia[0m:  0.92094, [1m[36mtrain_MCC Atelectasis[0m:  0.93246, [1m[36mtrain_MCC Pneumothorax[0m:  0.93578, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95606, [1m[36mtrain_MCC Pleural Other[0m:  0.94679, [1m[36mtrain_MCC Fracture[0m:  0.93980, [1m[36mtrain_MCC Support Devices[0m:  0.95222, [1m[36mtrain_MCC AVG[0m:  0.93865, [1m[36mtrain_Precision No Finding[0m:  0.96035, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97087, 

100%|██████████| 149/149 [00:55<00:00,  2.71it/s]
100%|██████████| 149/149 [00:39<00:00,  3.73it/s]
100%|██████████| 16/16 [00:04<00:00,  3.83it/s]


[1m[32mepoch[0m:   36, [1m[32mseconds_training_epoch[0m: 55.0648
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  5.32648, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96633, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96070, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95534, [1m[36mtrain_MCC Lung Opacity[0m:  0.93122, [1m[36mtrain_MCC Lung Lesion[0m:  0.96253, [1m[36mtrain_MCC Edema[0m:  0.92692, [1m[36mtrain_MCC Consolidation[0m:  0.94461, [1m[36mtrain_MCC Pneumonia[0m:  0.90576, [1m[36mtrain_MCC Atelectasis[0m:  0.94581, [1m[36mtrain_MCC Pneumothorax[0m:  0.94098, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95210, [1m[36mtrain_MCC Pleural Other[0m:  0.94353, [1m[36mtrain_MCC Fracture[0m:  0.94603, [1m[36mtrain_MCC Support Devices[0m:  0.94597, [1m[36mtrain_MCC AVG[0m:  0.94484, [1m[36mtrain_Precision No Finding[0m:  0.96983, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.99029, 

100%|██████████| 149/149 [00:55<00:00,  2.68it/s]
100%|██████████| 149/149 [00:39<00:00,  3.80it/s]
100%|██████████| 16/16 [00:03<00:00,  4.06it/s]


[1m[32mepoch[0m:   37, [1m[32mseconds_training_epoch[0m: 55.5851
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.95160, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.97350, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94657, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95315, [1m[36mtrain_MCC Lung Opacity[0m:  0.94956, [1m[36mtrain_MCC Lung Lesion[0m:  0.92497, [1m[36mtrain_MCC Edema[0m:  0.96543, [1m[36mtrain_MCC Consolidation[0m:  0.95537, [1m[36mtrain_MCC Pneumonia[0m:  0.94330, [1m[36mtrain_MCC Atelectasis[0m:  0.94978, [1m[36mtrain_MCC Pneumothorax[0m:  0.96646, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97655, [1m[36mtrain_MCC Pleural Other[0m:  0.95831, [1m[36mtrain_MCC Fracture[0m:  0.97009, [1m[36mtrain_MCC Support Devices[0m:  0.95853, [1m[36mtrain_MCC AVG[0m:  0.95654, [1m[36mtrain_Precision No Finding[0m:  0.97835, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95370, 

100%|██████████| 149/149 [00:56<00:00,  2.62it/s]
100%|██████████| 149/149 [00:38<00:00,  3.89it/s]
100%|██████████| 16/16 [00:04<00:00,  3.99it/s]


[1m[32mepoch[0m:   38, [1m[32mseconds_training_epoch[0m: 56.8603
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.15588, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96868, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.98053, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96819, [1m[36mtrain_MCC Lung Opacity[0m:  0.94407, [1m[36mtrain_MCC Lung Lesion[0m:  0.95001, [1m[36mtrain_MCC Edema[0m:  0.95795, [1m[36mtrain_MCC Consolidation[0m:  0.97774, [1m[36mtrain_MCC Pneumonia[0m:  0.91405, [1m[36mtrain_MCC Atelectasis[0m:  0.94217, [1m[36mtrain_MCC Pneumothorax[0m:  0.96638, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95894, [1m[36mtrain_MCC Pleural Other[0m:  0.98617, [1m[36mtrain_MCC Fracture[0m:  0.96400, [1m[36mtrain_MCC Support Devices[0m:  0.95673, [1m[36mtrain_MCC AVG[0m:  0.95969, [1m[36mtrain_Precision No Finding[0m:  0.97403, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.99065, 

100%|██████████| 149/149 [00:58<00:00,  2.56it/s]
100%|██████████| 149/149 [00:37<00:00,  4.00it/s]
100%|██████████| 16/16 [00:04<00:00,  3.91it/s]


[1m[32mepoch[0m:   39, [1m[32mseconds_training_epoch[0m: 58.2263
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.17595, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96139, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.93686, [1m[36mtrain_MCC Cardiomegaly[0m:  0.96370, [1m[36mtrain_MCC Lung Opacity[0m:  0.94406, [1m[36mtrain_MCC Lung Lesion[0m:  0.93749, [1m[36mtrain_MCC Edema[0m:  0.98080, [1m[36mtrain_MCC Consolidation[0m:  0.95175, [1m[36mtrain_MCC Pneumonia[0m:  0.95129, [1m[36mtrain_MCC Atelectasis[0m:  0.96512, [1m[36mtrain_MCC Pneumothorax[0m:  0.97489, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95508, [1m[36mtrain_MCC Pleural Other[0m:  0.98617, [1m[36mtrain_MCC Fracture[0m:  0.93459, [1m[36mtrain_MCC Support Devices[0m:  0.94861, [1m[36mtrain_MCC AVG[0m:  0.95656, [1m[36mtrain_Precision No Finding[0m:  0.96957, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.94444, 

100%|██████████| 149/149 [00:59<00:00,  2.51it/s]
100%|██████████| 149/149 [00:35<00:00,  4.14it/s]
100%|██████████| 16/16 [00:04<00:00,  3.95it/s]


[1m[32mepoch[0m:   40, [1m[32mseconds_training_epoch[0m: 59.4778
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.37563, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96374, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.92714, [1m[36mtrain_MCC Cardiomegaly[0m:  0.93203, [1m[36mtrain_MCC Lung Opacity[0m:  0.94316, [1m[36mtrain_MCC Lung Lesion[0m:  0.96891, [1m[36mtrain_MCC Edema[0m:  0.95783, [1m[36mtrain_MCC Consolidation[0m:  0.97028, [1m[36mtrain_MCC Pneumonia[0m:  0.95019, [1m[36mtrain_MCC Atelectasis[0m:  0.93418, [1m[36mtrain_MCC Pneumothorax[0m:  0.96361, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95991, [1m[36mtrain_MCC Pleural Other[0m:  0.98617, [1m[36mtrain_MCC Fracture[0m:  0.96418, [1m[36mtrain_MCC Support Devices[0m:  0.94682, [1m[36mtrain_MCC AVG[0m:  0.95487, [1m[36mtrain_Precision No Finding[0m:  0.97380, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.93519, 

100%|██████████| 149/149 [01:00<00:00,  2.45it/s]
100%|██████████| 149/149 [00:34<00:00,  4.29it/s]
100%|██████████| 16/16 [00:04<00:00,  3.99it/s]


[1m[32mepoch[0m:   41, [1m[32mseconds_training_epoch[0m: 60.7775
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.49544, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.92559, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.92574, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94036, [1m[36mtrain_MCC Lung Opacity[0m:  0.94315, [1m[36mtrain_MCC Lung Lesion[0m:  0.96926, [1m[36mtrain_MCC Edema[0m:  0.95909, [1m[36mtrain_MCC Consolidation[0m:  0.95918, [1m[36mtrain_MCC Pneumonia[0m:  0.95019, [1m[36mtrain_MCC Atelectasis[0m:  0.96715, [1m[36mtrain_MCC Pneumothorax[0m:  0.95006, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95306, [1m[36mtrain_MCC Pleural Other[0m:  0.94390, [1m[36mtrain_MCC Fracture[0m:  0.95172, [1m[36mtrain_MCC Support Devices[0m:  0.96666, [1m[36mtrain_MCC AVG[0m:  0.95037, [1m[36mtrain_Precision No Finding[0m:  0.93133, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96078, 

100%|██████████| 149/149 [01:02<00:00,  2.39it/s]
100%|██████████| 149/149 [00:33<00:00,  4.44it/s]
100%|██████████| 16/16 [00:04<00:00,  3.79it/s]


[1m[32mepoch[0m:   42, [1m[32mseconds_training_epoch[0m: 62.2239
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.20712, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95642, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94657, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95514, [1m[36mtrain_MCC Lung Opacity[0m:  0.94407, [1m[36mtrain_MCC Lung Lesion[0m:  0.94965, [1m[36mtrain_MCC Edema[0m:  0.94529, [1m[36mtrain_MCC Consolidation[0m:  0.98148, [1m[36mtrain_MCC Pneumonia[0m:  0.99297, [1m[36mtrain_MCC Atelectasis[0m:  0.94217, [1m[36mtrain_MCC Pneumothorax[0m:  0.95239, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95212, [1m[36mtrain_MCC Pleural Other[0m:  0.91565, [1m[36mtrain_MCC Fracture[0m:  0.95838, [1m[36mtrain_MCC Support Devices[0m:  0.97116, [1m[36mtrain_MCC AVG[0m:  0.95453, [1m[36mtrain_Precision No Finding[0m:  0.96930, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95370, 

100%|██████████| 149/149 [01:02<00:00,  2.38it/s]
100%|██████████| 149/149 [00:33<00:00,  4.48it/s]
100%|██████████| 16/16 [00:05<00:00,  3.17it/s]


[1m[32mepoch[0m:   43, [1m[32mseconds_training_epoch[0m: 62.6271
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.71139, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.98314, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96601, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95779, [1m[36mtrain_MCC Lung Opacity[0m:  0.95050, [1m[36mtrain_MCC Lung Lesion[0m:  0.95611, [1m[36mtrain_MCC Edema[0m:  0.96027, [1m[36mtrain_MCC Consolidation[0m:  0.97774, [1m[36mtrain_MCC Pneumonia[0m:  0.95065, [1m[36mtrain_MCC Atelectasis[0m:  0.95411, [1m[36mtrain_MCC Pneumothorax[0m:  0.95513, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96285, [1m[36mtrain_MCC Pleural Other[0m:  0.95831, [1m[36mtrain_MCC Fracture[0m:  0.93354, [1m[36mtrain_MCC Support Devices[0m:  0.97296, [1m[36mtrain_MCC AVG[0m:  0.95994, [1m[36mtrain_Precision No Finding[0m:  0.98701, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97222, 

100%|██████████| 149/149 [01:01<00:00,  2.42it/s]
100%|██████████| 149/149 [00:34<00:00,  4.32it/s]
100%|██████████| 16/16 [00:04<00:00,  3.35it/s]


[1m[32mepoch[0m:   44, [1m[32mseconds_training_epoch[0m: 61.5038
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.38548, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96400, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95600, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97027, [1m[36mtrain_MCC Lung Opacity[0m:  0.95874, [1m[36mtrain_MCC Lung Lesion[0m:  0.94965, [1m[36mtrain_MCC Edema[0m:  0.97443, [1m[36mtrain_MCC Consolidation[0m:  0.95938, [1m[36mtrain_MCC Pneumonia[0m:  0.97170, [1m[36mtrain_MCC Atelectasis[0m:  0.97102, [1m[36mtrain_MCC Pneumothorax[0m:  0.98054, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97067, [1m[36mtrain_MCC Pleural Other[0m:  0.95831, [1m[36mtrain_MCC Fracture[0m:  0.95222, [1m[36mtrain_MCC Support Devices[0m:  0.96935, [1m[36mtrain_MCC AVG[0m:  0.96473, [1m[36mtrain_Precision No Finding[0m:  0.96567, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97170, 

100%|██████████| 149/149 [01:00<00:00,  2.45it/s]
100%|██████████| 149/149 [00:35<00:00,  4.20it/s]
100%|██████████| 16/16 [00:04<00:00,  3.38it/s]


[1m[32mepoch[0m:   45, [1m[32mseconds_training_epoch[0m: 60.7929
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.80307, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.94479, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.95125, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95959, [1m[36mtrain_MCC Lung Opacity[0m:  0.96240, [1m[36mtrain_MCC Lung Lesion[0m:  0.95051, [1m[36mtrain_MCC Edema[0m:  0.96944, [1m[36mtrain_MCC Consolidation[0m:  0.95938, [1m[36mtrain_MCC Pneumonia[0m:  0.97887, [1m[36mtrain_MCC Atelectasis[0m:  0.94988, [1m[36mtrain_MCC Pneumothorax[0m:  0.96116, [1m[36mtrain_MCC Pleural Effusion[0m:  0.95416, [1m[36mtrain_MCC Pleural Other[0m:  0.95940, [1m[36mtrain_MCC Fracture[0m:  0.99407, [1m[36mtrain_MCC Support Devices[0m:  0.96124, [1m[36mtrain_MCC AVG[0m:  0.96115, [1m[36mtrain_Precision No Finding[0m:  0.94850, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.96262, 

100%|██████████| 149/149 [00:58<00:00,  2.53it/s]
100%|██████████| 149/149 [00:36<00:00,  4.08it/s]
100%|██████████| 16/16 [00:04<00:00,  3.42it/s]


[1m[32mepoch[0m:   46, [1m[32mseconds_training_epoch[0m: 58.9138
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.86843, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.98551, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96569, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95765, [1m[36mtrain_MCC Lung Opacity[0m:  0.94958, [1m[36mtrain_MCC Lung Lesion[0m:  0.94945, [1m[36mtrain_MCC Edema[0m:  0.95397, [1m[36mtrain_MCC Consolidation[0m:  0.95200, [1m[36mtrain_MCC Pneumonia[0m:  0.97887, [1m[36mtrain_MCC Atelectasis[0m:  0.94630, [1m[36mtrain_MCC Pneumothorax[0m:  0.94116, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97557, [1m[36mtrain_MCC Pleural Other[0m:  0.95831, [1m[36mtrain_MCC Fracture[0m:  0.95222, [1m[36mtrain_MCC Support Devices[0m:  0.95582, [1m[36mtrain_MCC AVG[0m:  0.95872, [1m[36mtrain_Precision No Finding[0m:  0.99561, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.99038, 

100%|██████████| 149/149 [00:57<00:00,  2.58it/s]
100%|██████████| 149/149 [00:30<00:00,  4.91it/s]
100%|██████████| 16/16 [00:03<00:00,  4.79it/s]


[1m[32mepoch[0m:   47, [1m[32mseconds_training_epoch[0m: 57.7046
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  4.29911, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96868, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.94657, [1m[36mtrain_MCC Cardiomegaly[0m:  0.94918, [1m[36mtrain_MCC Lung Opacity[0m:  0.95323, [1m[36mtrain_MCC Lung Lesion[0m:  0.93749, [1m[36mtrain_MCC Edema[0m:  0.97191, [1m[36mtrain_MCC Consolidation[0m:  0.96283, [1m[36mtrain_MCC Pneumonia[0m:  0.95796, [1m[36mtrain_MCC Atelectasis[0m:  0.93246, [1m[36mtrain_MCC Pneumothorax[0m:  0.95829, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96383, [1m[36mtrain_MCC Pleural Other[0m:  0.88740, [1m[36mtrain_MCC Fracture[0m:  0.97009, [1m[36mtrain_MCC Support Devices[0m:  0.94049, [1m[36mtrain_MCC AVG[0m:  0.95003, [1m[36mtrain_Precision No Finding[0m:  0.97403, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.95370, 

100%|██████████| 149/149 [00:44<00:00,  3.38it/s]
100%|██████████| 149/149 [00:27<00:00,  5.32it/s]
100%|██████████| 16/16 [00:03<00:00,  4.68it/s]


[1m[32mepoch[0m:   48, [1m[32mseconds_training_epoch[0m: 44.0922
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.63179, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.97096, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96580, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97478, [1m[36mtrain_MCC Lung Opacity[0m:  0.95781, [1m[36mtrain_MCC Lung Lesion[0m:  0.90574, [1m[36mtrain_MCC Edema[0m:  0.95783, [1m[36mtrain_MCC Consolidation[0m:  0.95918, [1m[36mtrain_MCC Pneumonia[0m:  0.97197, [1m[36mtrain_MCC Atelectasis[0m:  0.95583, [1m[36mtrain_MCC Pneumothorax[0m:  0.96402, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96483, [1m[36mtrain_MCC Pleural Other[0m:  0.94502, [1m[36mtrain_MCC Fracture[0m:  0.97615, [1m[36mtrain_MCC Support Devices[0m:  0.97116, [1m[36mtrain_MCC AVG[0m:  0.96008, [1m[36mtrain_Precision No Finding[0m:  0.98246, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.98113, 

100%|██████████| 149/149 [00:44<00:00,  3.36it/s]
100%|██████████| 149/149 [00:27<00:00,  5.38it/s]
100%|██████████| 16/16 [00:03<00:00,  4.68it/s]


[1m[32mepoch[0m:   49, [1m[32mseconds_training_epoch[0m: 44.4002
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.77892, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.96851, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96601, [1m[36mtrain_MCC Cardiomegaly[0m:  0.95327, [1m[36mtrain_MCC Lung Opacity[0m:  0.95324, [1m[36mtrain_MCC Lung Lesion[0m:  0.91245, [1m[36mtrain_MCC Edema[0m:  0.96165, [1m[36mtrain_MCC Consolidation[0m:  0.93634, [1m[36mtrain_MCC Pneumonia[0m:  0.96476, [1m[36mtrain_MCC Atelectasis[0m:  0.95176, [1m[36mtrain_MCC Pneumothorax[0m:  0.96942, [1m[36mtrain_MCC Pleural Effusion[0m:  0.97068, [1m[36mtrain_MCC Pleural Other[0m:  0.95831, [1m[36mtrain_MCC Fracture[0m:  0.94026, [1m[36mtrain_MCC Support Devices[0m:  0.95856, [1m[36mtrain_MCC AVG[0m:  0.95466, [1m[36mtrain_Precision No Finding[0m:  0.98238, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.97222, 

100%|██████████| 149/149 [00:44<00:00,  3.34it/s]
100%|██████████| 149/149 [00:27<00:00,  5.44it/s]
100%|██████████| 16/16 [00:03<00:00,  4.63it/s]


[1m[32mepoch[0m:   50, [1m[32mseconds_training_epoch[0m: 44.5969
	[1m[32mTRAIN RESULTS: [0m[1m[36mtrain_Loss[0m:  3.80109, [1m[36mtrain_Num Samples[0m:  2234.00000, [1m[36mtrain_MCC No Finding[0m:  0.95671, [1m[36mtrain_MCC Enlarged Cardiomediastinum[0m:  0.96569, [1m[36mtrain_MCC Cardiomegaly[0m:  0.97459, [1m[36mtrain_MCC Lung Opacity[0m:  0.94131, [1m[36mtrain_MCC Lung Lesion[0m:  0.93749, [1m[36mtrain_MCC Edema[0m:  0.97443, [1m[36mtrain_MCC Consolidation[0m:  0.93373, [1m[36mtrain_MCC Pneumonia[0m:  0.92993, [1m[36mtrain_MCC Atelectasis[0m:  0.94616, [1m[36mtrain_MCC Pneumothorax[0m:  0.96646, [1m[36mtrain_MCC Pleural Effusion[0m:  0.96872, [1m[36mtrain_MCC Pleural Other[0m:  0.95831, [1m[36mtrain_MCC Fracture[0m:  0.95190, [1m[36mtrain_MCC Support Devices[0m:  0.96396, [1m[36mtrain_MCC AVG[0m:  0.95496, [1m[36mtrain_Precision No Finding[0m:  0.96121, [1m[36mtrain_Precision Enlarged Cardiomediastinum[0m:  0.99038, 

In [None]:
# MODELS = {
#     ('effnetv2', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_effnetv2(pretrain, int(in_ch), int(out_ch))),
#     ('resnet50', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_resnet('resnet50', pretrain, int(in_ch), int(out_ch))),
#     ('resnet18', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_resnet('resnet18', pretrain, int(in_ch), int(out_ch))),
#     ('efficientnet-b0', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_efficientnetv1('efficientnet-b0', pretrain, int(in_ch), int(out_ch))),
#     ('efficientnet-b1', str, str, str): (
#         lambda pretrain, in_ch, out_ch: get_efficientnetv1('efficientnet-b1', pretrain, int(in_ch), int(out_ch))),
#     ('waveletres18', str, str, str): lambda pretrain, in_ch, out_ch: R(
#         pretrain, int(in_ch), int(out_ch)),
#     ('waveletmlp', str, str, str, str, str, str, str): (
#         lambda mlp_channels, in_ch, out_ch, wavelet_levels, patch_size, in_ch_mul, mlp_depth: get_DeepFixEnd2End(
#             int(in_ch), int(out_ch),
#             in_ch_multiplier=int(in_ch_mul), wavelet='db1',
#             wavelet_levels=int(wavelet_levels), wavelet_patch_size=int(patch_size),
#             mlp_depth=int(mlp_depth), mlp_channels=int(mlp_channels),
#             mlp_fix_weights='none', mlp_activation=None)
#         ),

#     #  ('waveletres18v2', str, str, str): lambda pretrain, in_ch, out_ch: (
#         #  DeepFixCompression(levels=8, wavelet='coif1', patch_size=1),
#         #  R2(pretrain, int(in_ch), int(out_ch))),
# }


# class R(T.nn.Module):
#     def __init__(self, pretrain, in_ch, out_ch):
#         super().__init__()
#         self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)
#         self.dwt = pyw.DWT(J=8, wave='coif1', mode='zero')

#     @staticmethod
#     def wavelet_coefficients_as_tensorimage(approx, detail, normalize=False):
#         B,C = approx.shape[:2]
#         fixed_dims = approx.shape[:-2] # num images in minibatch, num channels, etc
#         output_shape = fixed_dims + (
#             detail[0].shape[-2]*2,  # input img height
#             detail[0].shape[-1]*2)  # input img width
#         im = T.zeros(output_shape, device=approx.device, dtype=approx.dtype)
#         if normalize:
#             norm11 = lambda x: (x / max(x.min()*-1, x.max()))  # into [-1,+1] preserving sign
#             #  approx = norm11(approx)
#         im[..., :approx.shape[-2], :approx.shape[-1]] = approx if approx is not None else 0
#         for level in detail:
#             lh, hl, hh = level.unbind(-3)
#             h,w = lh.shape[-2:]
#             if normalize:
#                 lh, hl, hh = [norm11(x) for x in [lh, hl, hh]]
#             #  im[:h, :w] = approx
#             im[..., 0:h, w:w+w] = lh  # horizontal
#             im[..., h:h+h, :w] = hl  # vertical
#             im[..., h:h+h, w:w+w] = hh  # diagonal
#         return im

#     def forward(self, x):
#         x = self.wavelet_coefficients_as_tensorimage(*self.dwt(x))
#         return self.r(x)


# class R2(T.nn.Module):
#     def __init__(self, pretrain, in_ch, out_ch):
#         super().__init__()
#         self.r = get_resnet('resnet18', pretrain, in_ch, out_ch,)

#     def forward(self, x):
#         B,C,H = x.shape
#         x = x.unsqueeze(-1).repeat(1,1,1,H)
#         return self.r(x)


# class LossCheXpertIdentity(T.nn.Module):
#     def __init__(self, N):
#         super().__init__()
#         self.bce = T.nn.BCEWithLogitsLoss()
#         self.N = N

#     def forward(self, yhat, y):
#         # absolute max possible num patients in chexpert is 223414
#         # but let's just hash them into a smaller number of bins via modulo N
#         assert self.N == yhat.shape[1], \
#                 f'note: model must have {self.N} binary predictions per sample'
#         y_onehot = y.new_zeros(y.shape[0], self.N, dtype=T.float
#                                ).scatter_(1, y.long()%self.N, 1)
#         return self.bce(yhat[:, -1], y_onehot[:, -1])


# class LossCheXpertUignore(T.nn.Module):
#     def __init__(self):
#         super().__init__()
#         self.bce = T.nn.BCEWithLogitsLoss()

#     def forward(self, yhat, y):
#         ignore = (y != 2)  # ignore uncertainty labels
#         return self.bce(yhat[ignore], y[ignore])


# def loss_intelmobileodt(yhat, y):
#     """Cross-entropy loss with class balancing weights.

#     Not sure this actually helps, because Type 2 is the hardest class: it
#     has the most samples, and it separates Type 1 from Type 3.  Arguably, Type 2
#     samples are on the decision boundary between Type 1 and 3.
#     Class balancing weights make it harder to focus on class 2.
#     """
#     #  assert y.shape == yhat.shape, 'sanity check'
#     #  assert y.dtype == yhat.dtype, 'sanity check'

#     # class distribution of stage='train'
#     w = T.tensor([249, 781, 450], dtype=y.dtype, device=y.device)
#     w = (w.max() / w).reshape(1, 3)
#     # w can have any of the shapes:  (B,1) or (1,C) or (B,C)
#     #  return T.nn.functional.binary_cross_entropy_with_logits(yhat, y, weight=w)
#     return T.nn.functional.cross_entropy(yhat, y, weight=w)
#     # can't apply focal loss unless do it manually.


# def onehot(y, nclasses):
#     return T.zeros((y.numel(), nclasses), dtype=y.dtype, device=y.device)\
#             .scatter_(1, y.unsqueeze(1), 1)


# def _upsample_pad_minibatch_imgs_to_same_size(batch, target_is_segmentation_mask=False):
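#     """A collate function for a dataloader of (x,y) samples.  Pads every
#     image (and, if `target_is_segmentation_mask`, its target) to the largest
#     height and width in the minibatch, splitting the padding evenly between
#     both sides, then stacks the results."""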
#     shapes = [item[0].shape for item in batch]
#     H = max(h for c,h,w in shapes)
#     W = max(w for c,h,w in shapes)
#     X, Y = [], []
#     for item in batch:
#         h,w = item[0].shape[1:]
#         dh, dw = (H-h), (W-w)
#         padding = (dw//2, dw-dw//2, dh//2, dh-dh//2, )
#         X.append(T.nn.functional.pad(item[0], padding))
#         if target_is_segmentation_mask:
#             Y.append(T.nn.functional.pad(item[1], padding))
#         else:
#             Y.append(item[1])
#     return T.stack(X), T.stack(Y)


# def get_dset_chexpert(train_frac=.8, val_frac=.2, small=False,
#                       labels:str='diagnostic', num_identities=None):
#     """
#     Args:
#         labels:  either "diagnostic" (the 14 classes defined as
#             D.CheXpert.LABELS_DIAGNOSTIC) or "identity" ("patient", "study",
#             "view", "index")
#         small:  whether to use the CheXpert_Small dataset (previously
#             downsampled images) or the full-size dataset.
#         num_identities:  used only if labels='identity'.  If
#             num_identities=1000, then all patients get identified as coming
#             from precisely 1 of 1000 bins.

#     Returns:
#         (
#         {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
#          'train_loader': ..., 'val_loader': ..., 'test_loader': ...
#          },

#         ('Pneumonia', 'Cardiomegaly', ...)  # class names defined by `labels`
#         )
#     """
#     _label_cleanup_dct = dict(D.CheXpert.LABEL_CLEANUP_DICT)
#     if labels == 'diagnostic':
#         class_names = D.CheXpert.LABELS_DIAGNOSTIC
#         for k in class_names:
#             _label_cleanup_dct[k][np.nan] = 0  # remap missing value to negative
#         get_ylabels = lambda dct: \
#                 D.CheXpert.format_labels(dct, labels=class_names).float()
#     elif labels == 'identity':
#         class_names = list(range(num_identities))
#         get_ylabels = lambda dct: \
#                 (D.CheXpert.format_labels(dct, labels=['index']) % num_identities).long()
#     else:
#         raise NotImplementedError(f"unrecognized labels: {labels}")
#     kws = dict(
#         img_transform=tvt.Compose([
#             #  tvt.RandomCrop((512, 512)),
#             tvt.ToTensor(),  # full res 1024x1024 imgs
#         ]),
#         getitem_transform=lambda dct: (dct['image'], get_ylabels(dct)),
#         label_cleanup_dct=_label_cleanup_dct,
#     )
#     if small:
#         kls = D.CheXpert_Small
#     else:
#         kls = D.CheXpert

#     train_dset = kls(dataset_dir="../data/CheXpert-v1.0-small/",use_train_set=True, **kws)  #Edited Elvin

#     N = len(train_dset)
#     if train_frac + val_frac == 1:
#         nsplits = [N - int(N*val_frac), int(N*val_frac), 0]
#     else:
#         a,b = int(N*train_frac), int(N*val_frac)
#         nsplits = [a,b, N-a-b]
#     train_dset, val_dset, _ = T.utils.data.random_split(train_dset, nsplits)
#     test_dset = kls(dataset_dir="../data/CheXpert-v1.0-small/",use_train_set=False, **kws) #Edited Elvin
#     batch_dct = dict(
#         batch_size=15, collate_fn=_upsample_pad_minibatch_imgs_to_same_size,
#         num_workers=int(os.environ.get("num_workers", 4)))  # upsample pad must take time
#     train_loader=DataLoader(train_dset, shuffle=True, **batch_dct)
#     val_loader=DataLoader(val_dset, **batch_dct)
#     test_loader=DataLoader(test_dset, **batch_dct)
#     return (dict(
#         train_dset=train_dset, val_dset=val_dset, test_dset=test_dset,
#         train_loader=train_loader, val_loader=val_loader, test_loader=test_loader,
#     ), class_names)


# def get_dset_intel_mobileodt(stage_trainval:str, use_val:str, stage_test:str, augment:str
#                              ) -> (dict[str,Optional[Union[Dataset,DataLoader]]], tuple[str]):
#     """Obtain train/val/test splits for the IntelMobileODT Cervical Cancer
#     Colposcopy dataset, and the data loaders.

#     Args:
#         stage_trainval: the `stage` for training and validation.
#             i.e. Possible choices:  {'train', 'train+additional'}
#             Train / val split is 70/30 random stratified split.
#         use_val: Whether to create a validation set
#             Choices:  {"val", "noval"}
#         stage_test: the `stage` for test set.  Should be "test".
#         augment: Type of augmentations to apply.  One of {'v1', }.
#             "v1" - make the aspect ratio .75, resize images to (200,150), and convert in range [0,1]
#     Returns:
#         (
#         {'train_dset': ..., 'val_dset': ..., 'test_dset': ...,
#          'train_loader': ..., 'val_loader': ..., 'test_loader': ...
#          },

#         ('Type 1', 'Type 2', 'Type 3')
#         )
#     """
#     assert augment == 'v1', 'code bug: other augmentations not implemented'
#     base_dir = './data/intel_mobileodt_cervical_resized'
#     dset_trainval = D.IntelMobileODTCervical(stage_trainval, base_dir)
#     _y = [dset_trainval.getitem(i, load_img=False)
#           for i in range(len(dset_trainval))]
#     dct = {'test_dset': D.IntelMobileODTCervical(stage_test, base_dir)}
#     if use_val == 'noval':
#         dct['train_dset'] = dset_trainval
#         dct['val_dset'] = None
#     else:
#         assert use_val == 'val', f'unrecognized option: {use_val}'
#         idxs_train, idxs_val = list(
#             StratifiedShuffleSplit(1, test_size=.3).split(
#                 np.arange(len(dset_trainval)), _y))[0]
#         dct['train_dset'] = T.utils.data.Subset(dset_trainval, idxs_train)
#         dct['val_dset'] = T.utils.data.Subset(dset_trainval, idxs_val)

#     # preprocess train/val/test images all the same way
#     preprocess_v1 = tvt.Compose([
#         #
#         ### previously done (to save computation time) ###
#         #  D.IntelMobileODTCervical.fix_aspect_ratio,
#         #  tvt.Resize((200, 150)),  # interpolation=tvt.InterpolationMode.NEAREST),
#         #
#         lambda x: x.float()/255.
#     ])
#     dct = {k: D.PreProcess(v, lambda xy: (
#         preprocess_v1(xy[0]),
#         #  onehot(xy[1].unsqueeze(0).long()-1, 3).squeeze_().float()))
#         xy[1].long()-1))
#         for k,v in dct.items()}
#     dct.update(dict(
#         train_loader=DataLoader(dct['train_dset'], batch_size=20, shuffle=True),
#         test_loader=DataLoader(dct['test_dset'], batch_size=20),))
#     if dct['val_dset'] is None:
#         dct['val_loader'] = None
#     else:
#         dct['val_loader'] = DataLoader(dct['val_dset'], batch_size=20)
#     class_names = [x.replace('_', ' ') for x in D.IntelMobileODTCervical.LABEL_NAMES]
#     return dct, class_names


# LOSS_FNS = {
#     ('BCEWithLogitsLoss', ): lambda _: T.nn.BCEWithLogitsLoss(),
#     ('CrossEntropyLoss', ): lambda _: T.nn.CrossEntropyLoss(),
#     ('CE_intelmobileodt', ): lambda _: loss_intelmobileodt,
#     ('chexpert_uignore', ): lambda _: LossCheXpertUignore(),
#     ('chexpert_identity', str): lambda out_ch: LossCheXpertIdentity(N=int(out_ch)),
# }

# DSETS = {
#     ('intel_mobileodt', str, str, str, str): (
#         lambda train, val, test, aug: get_dset_intel_mobileodt(train, val, test, aug)),
#     #  ('origa', ... todo): ( lambda ...: get_dset_origa(...)
#     #  ('riga', ... todo): ( lambda ...: get_dset_riga(...)
#     ('chexpert', str, str): (
#         lambda train_frac, val_frac: get_dset_chexpert(
#             float(train_frac), float(val_frac), small=False, labels='diagnostic')),
#     ('chexpert_small', str, str): (
#         lambda train_frac, val_frac: get_dset_chexpert(
#             float(train_frac), float(val_frac), small=True, labels='diagnostic')),
#     ('chexpert_small_ID', str, str, str): (
#         lambda num_identities, train_frac, val_frac: get_dset_chexpert(
#             float(train_frac), float(val_frac), small=True,
#             labels='identity', num_identities=int(num_identities))),
# }


# def match(spec:str, dct:dict):
#     return pampy.match(spec.split(':'), *(x for y in dct.items() for x in y))


# def get_model_opt_loss(
#         model_spec:str, opt_spec:str, loss_spec:str, regularizer_spec:str,
#         device:str) -> dict[str, Union[T.nn.Module, T.optim.Optimizer]]:
#     """
#     Args:
#         model_spec: a string of form,
#             "model_name:pretraining:in_channels:out_classes".  For example:
#             "effnetv2:untrained:1:5"
#         opt_spec: Specifies how to create optimizer.
#             First value is a pytorch Optimizer in T.optim.*.
#             Other values are numerical parameters.
#             Example: "SGD:lr=.003:momentum=.9"
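#         loss_spec: Key used to look up the loss in LOSS_FNS.
#             Example: "CrossEntropyLoss" or "chexpert_identity:N"
#         regularizer_spec: 'none', or 'deepfixmlp:X' to wrap the loss in
#             RegularizedLoss with X (a float) as the regularizer weight.
#         device: e.g. 'cpu' or 'cuda'
#     Returns:
#         a dict with keys 'model', 'optimizer' and 'loss_fn'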
#     """
#     mdl = match(model_spec, MODELS)
#     mdl = mdl.to(device, non_blocking=True)
#     optimizer = reset_optimizer(opt_spec, mdl)
#     loss_fn = match(loss_spec, LOSS_FNS)
#     if regularizer_spec != 'none':
#         loss_fn = RegularizedLoss(mdl, loss_fn, regularizer_spec)
#     return dict(model=mdl, optimizer=optimizer, loss_fn=loss_fn)


# class RegularizedLoss(T.nn.Module):
#     def __init__(self, model, lossfn, regularizer_spec:str):
#         super().__init__()
#         self.lossfn = lossfn
#         self.regularizer_spec = regularizer_spec
#         if regularizer_spec == 'none':
#             self.regularizer = lambda *y: 0
#         elif regularizer_spec.startswith('deepfixmlp:'):
#             lbda = float(regularizer_spec.split(':')[1])
#             self.regularizer = lambda *y: (
#                 float(lbda) * DeepFixMLP.get_VecAttn_regularizer(model))
#         else:
#             raise NotImplementedError(regularizer_spec)

#     def forward(self, yhat, y):
#         return self.lossfn(yhat, y) + self.regularizer(yhat, y)

#     def __repr__(self):
#         return f'RegularizedLoss<{repr(self.lossfn)},{self.regularizer_spec}>'


# def get_dset_loaders_resultfactory(dset_spec:str) -> dict:
#     dct, class_names = match(dset_spec, DSETS)
#     if any(dset_spec.startswith(x) for x in {'intel_mobileodt:',
#                                              'chexpert_small_ID:'}):
#         #  dct['result_factory'] = lambda: TL.MultiLabelBinaryClassification(
#                 #  class_names, binarize_fn=lambda yh: (T.sigmoid(yh)>.5).long())
#         dct['result_factory'] = lambda: TL.MultiClassClassification(
#                 len(class_names), binarize_fn=lambda yh: yh.softmax(1).argmax(1))
#     elif any(dset_spec.startswith(x) for x in {'chexpert:', 'chexpert_small:'}):
#         dct['result_factory'] = lambda: CheXpertMultiLabelBinaryClassification(
#             class_names, binarize_fn=lambda yh: (yh.sigmoid()>.5).long(), report_avg=True)
#     else:
#         raise NotImplementedError(f"I don't know how to create the result factory for {dset_spec}")
#     return dct

# class CheXpertMultiLabelBinaryClassification(TL.MultiLabelBinaryClassification):
#     def update(self, yhat, y, loss) -> None:
#         self.num_samples += yhat.shape[0]
#         self.loss += loss.item()
#         assert yhat.shape == y.shape
#         assert yhat.ndim == 2 and yhat.shape[1] == len(self._cms), "sanity check: model outputs expected prediction shape"
#         binarized = self._binarize_fn(yhat)
#         assert binarized.dtype == T.long, 'sanity check binarize fn'
#         assert binarized.shape == y.shape, 'sanity check binarize fn'
#         ignore = (y != 2)  # True where the label is usable; entries equal to 2 (uncertain) are skipped below
#         for i, (kls, cm) in enumerate(self._cms.items()):
#             rows = ignore[:, i]
#             if rows.sum() == 0:
#                 continue  # don't update a confusion matrix if all data for this class is ignored
#             cm += metrics.confusion_matrix(y[rows, i], binarized[rows, i], num_classes=2).cpu()


# def get_deepfix_train_strategy(args:'TrainOptions'):
#     deepfix_spec = args.deepfix
#     if deepfix_spec == 'off':
#         return TL.train_one_epoch
#     elif deepfix_spec.startswith('reinit:'):
#         _, N, P, R = deepfix_spec.split(':')
#         return dfs.DeepFix_TrainOneEpoch(int(N), float(P), int(R), TL.train_one_epoch)
#     elif deepfix_spec.startswith('dhist:'):
#         fp = deepfix_spec.split(':', 1)[1]
#         assert exists(fp), f'histogram file not found: {fp}'
#         return dfs.DeepFix_DHist(fp)
#     elif deepfix_spec.startswith('dfhist:'):
#         fp = deepfix_spec.split(':', 1)[1]
#         assert exists(fp), f'histogram file not found: {fp}'
#         return dfs.DeepFix_DHist(fp, fixed=True)
#     elif deepfix_spec == 'fixed':
#         return dfs.DeepFix_DHist('', fixed=True, init_with_hist=False)
#     elif deepfix_spec.startswith('beta:'):
#         alpha, beta = deepfix_spec.split(':')[1:]
#         return dfs.DeepFix_LambdaInit(
#             lambda cfg: init_from_beta(cfg.model, float(alpha), float(beta)))
#     elif deepfix_spec.startswith('ghaarconv2d:'):
#         ignore_layers = deepfix_spec.split(':')[1].split(',')
#         return dfs.DeepFix_LambdaInit(
#             lambda cfg: (
#                 print(f'initialize {deepfix_spec}'),
#                 convert_conv2d_to_gHaarConv2d(cfg.model, ignore_layers=ignore_layers),
#                 reset_optimizer(args.opt, cfg.model),
#                 print(cfg.model)
#             ))
#     else:
#         raise NotImplementedError(deepfix_spec)


# def train_config(args:'TrainOptions') -> TL.TrainConfig:
#     return TL.TrainConfig(
#         **get_model_opt_loss(
#             args.model, args.opt, args.lossfn, args.loss_reg, args.device),
#         **get_dset_loaders_resultfactory(args.dset),
#         device=args.device,
#         epochs=args.epochs,
#         start_epoch=args.start_epoch,
#         train_one_epoch=get_deepfix_train_strategy(args),
#         experiment_id=args.experiment_id,
#     )


# @dc.dataclass
# class TrainOptions:
#     """High-level configuration for training PyTorch models
#     on any dataset registered in DSETS (IntelMobileODT or CheXpert variants).
#     """
#     epochs:int = 50
#     start_epoch:int = 0  # if "--start_epoch 1", then don't evaluate perf before training.
#     device:str = 'cuda' if T.cuda.is_available() else 'cpu'
#     dset:str = None #choice(
#         #  'intel_mobileodt:train:val:test:v1',
#         #  'intel_mobileodt:train+additional:val:test:v1',
#         #  'intel_mobileodt:train+additional:noval:test:v1',
#         #  'chexpert:.8:.2', 'chexpert:.01:.01', 'chexpert:.001:.001',
#         #  'chexpert_small:.8:.2', 'chexpert_small:.01:.01',
#         #   'chexpert_small:.001:.001',
#         #  default='intel_mobileodt:train:val:test:v1')
#     opt:str = 'SGD:lr=.001:momentum=.9:nesterov=1'
#     lossfn:str = None  # choices:
#         #  'BCEWithLogitsLoss',
#         #  'CrossEntropyLoss', 
#         #  'CE_intelmobileodt',
#         #  'chexpert_uignore', 
#         #  'chexpert_identity:N' for some N=num_identities predicted by model (compared to identities y%N)
#     loss_reg:str = 'none'  # Optionally add a regularizer to the loss.  loss + reg.  Accepted values:  'none', 'deepfixmlp:X' where X is a positive float denoting the lambda in l1 regularizer
#     model:str = 'resnet18:imagenet:3:3'  # Model specification adheres to the template "model_name:pretraining:in_ch:out_ch"
#     deepfix:str = 'off'  # DeepFix Re-initialization Method.
#                          #  "off" or "fixed" or "reinit:N:P:R" or "d[f]hist:path_to_histogram.pth"
#                          #  or "beta:A:B" for A,B as (float) parameters of the beta distribution
#                          # 'ghaarconv2d:layer1,layer2' Replaces all spatial convolutions with GHaarConv2d layer except the specified layers
#     experiment_id:str = os.environ.get('run_id', 'debugging')
#     prune:str = 'off'

#     def execute(self):
#         cfg = train_config(self)
#         cfg.train(cfg)


# def main():
#     p = ArgumentParser()
#     p.add_arguments(TrainOptions, dest='TrainOptions')

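#     # NOTE: `args` is never assigned while the line below stays commented out,
#     # so `print(args)` would raise NameError; re-enable it before running main().
# #     args = p.parse_args(["--dset", "chexpert_small:.01:.01", "--opt", "Adam:lr=0.001", "--lossfn", "chexpert_uignore", "--model", "waveletmlp:300:1:14:7:1:1:2", "--loss_reg", "none"]).TrainOptions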

#     print(args)
#     cfg = train_config(args)
    
# # python deepfix/train.py --dset chexpert_small:.01:.01 --opt Adam:lr=0.001 --lossfn chexpert_uignore --model waveletmlp:300:1:14:7:1:1:2 --loss_reg none    
    
#     if args.prune != 'off':
#         assert args.prune.startswith('ChannelPrune:')
#         raise NotImplementedError('code is a bit hardcoded, so it is not available without hacking on it.')
#         print(args.prune)
#         from explainfix import channelprune
#         from deepfix.weight_saliency import costfn_multiclass
#         a = sum([x.numel() for x in cfg.model.parameters()])
#         channelprune(cfg.model, pct=5, grad_cost_fn=costfn_multiclass,
#                      loader=cfg.train_loader, device=cfg.device, num_minibatches=10)
#         b = sum([x.numel() for x in cfg.model.parameters()])
#         assert a/b != 1
#         print(f'done channelpruning.  {a/b}')

#     cfg.train(cfg)
#     #  import IPython ; IPython.embed() ; import sys ; sys.exit()

#     #  with T.profiler.profile(
#     #      activities=[
#     #          T.profiler.ProfilerActivity.CPU,
#     #          T.profiler.ProfilerActivity.CUDA,
#     #      ], with_modules=True,
#     #  ) as p:
#     #      cfg.train(cfg)
#     #  print(p.key_averages().table(
#     #      sort_by="self_cuda_time_total", row_limit=-1))


# if __name__ == "__main__":
#     main()


In [4]:
# os.getcwd()
# !ls

In [4]:
# args = {}
# args['dset'] = 'chexpert_small:.01:.01'
# args['opt'] = 'Adam:lr=0.001'
# args['lossfn'] = 'chexpert_uignore'
# args['model'] = 'waveletmlp:300:1:14:7:1:1:2'
# args['loss_reg'] = None
# args['prune'] = 'off'

In [9]:
# args.dset

In [21]:
# import pandas as pd

In [23]:
# t = pd.read_csv('../data/CheXpert-v1.0-small/train.csv')