This notebook computes all of the "distances" (the fuzzy logic scores for IOU, DICE, ...) between the GradCam maps produced by the final models and the visual characterstics maps created by the dermatologists. That is: 

```
for each image i  
  for each GradCam image i_gc  
    for each dermatologist d  
      for each characteristic d_char  
        compute the visual distance between i_gc and d_char 
```


In [122]:
%matplotlib inline
import pandas as pd
import numpy as np
from pathlib import Path
from collections import defaultdict
import matplotlib.pyplot as plt 
from PIL import Image
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)


In [39]:
classes = [
    "Acne",
    "Actinic keratosis",
    "Psoriasis",
    "Seborrheic dermatitis",
    "Viral warts",
    "Vitiligo"
]

derms = [
    'derm1',
    'derm2',
    'derm3',
    'derm4',
    'derm5',
    'derm6',
    'derm7',
    'derm8',
]

characteristics = [
    'Closed comedo',
    'Cyst',
    'Dermatoglyph disruption',
    'Leukotrichia',
    'Macule',
    'Nodule',
    'Open comedo',
    'Papule',
    'Patch',
    'Plaque',
    'Pustule',
    'Scale',
    'Scar',
    'Sun damage',
    'Telangiectasia',
    'Thrombosed capillaries'
]

images_path = Path('/home/ubuntu/hot-store/dermx/all_images')
masks_path = Path('/home/ubuntu/hot-store/dermx_masks/per_image')
results_path = Path('/home/ubuntu/hot-store/final/')
columns = [
         'filename',
         'gradcam_class',
         'iou',
         'dice',
         'precision',
         'recall',
         'negative_predictive_value',
         'specificity'
    ]


# Metrics supporting probabilistic segmentation maps
fuzzy_and = lambda x,y: np.minimum(x,y)
fuzzy_or = lambda x,y: np.maximum(x,y)
fuzzy_not = lambda x: 1-x

def pixel_metrics_fuzzy(y_true, y_pred):
    """
    Pixel-level metrics of segmentation accuracy following fuzzy logic operators.
    
    :param y_true: numpy.ndarray of reference segmentation, values in [0,1]
    :param y_pred: numpy.ndarray of predicted segmentation, values in [0,1]

    :return: a dictionary encoding the metrics
    """
        
    np.testing.assert_equal(y_true.shape, y_pred.shape, err_msg="Expecting \
    the reference and predicted segmentations to be of the same size.")
    
    # Check the ranges
    np.testing.assert_equal(np.logical_and(y_true >= 0, y_true <= 1).all(), True, err_msg="Expecting \
    the reference segmentations to be in the range 0 to 1.")
    np.testing.assert_equal(np.logical_and(y_pred >= 0, y_pred <= 1).all(), True, err_msg="Expecting \
    the predicted segmentations to be in the range 0 to 1.")
    
    TP = fuzzy_and(y_true, y_pred).sum()
    TN = fuzzy_and(fuzzy_not(y_true), fuzzy_not(y_pred)).sum()
    union = fuzzy_or(y_true, y_pred).sum()
    
    metrics = {}
    
    # Summary metrics
    metrics["iou"] = TP / union
    metrics["dice"] = 2 * TP / ( y_true.sum() + y_pred.sum() ) 
    
    # Positive class metrics
    metrics["precision"] = TP / y_pred.sum()
    metrics["recall"] = TP / y_true.sum()
    
    # Negative class metrics
    metrics["negative_predictive_value"] = TN / fuzzy_not(y_pred).sum()
    metrics["specificity"] = TN / fuzzy_not(y_true).sum()
    
    return metrics


def calculate_mask_metrics(gradcam_path, mask_path, interpolation_method=Image.NEAREST):
    """
    Calculates the fuzzy logic metrics given the paths to a pair of input images.
    The derm mask is resized to match the size of the gradcam image.
    
    Input:
    - gradcam_image_path: Pathlib path to a gradCam image. The file is assumed to be in .npy format.
    - derm_char_mask_path: Pathlib path to a derm annotation. The file is assumed to be in a format that can
                           be opened by PIL.
    - interpolation_method: String. The method used for interpolation when resizing the derm mask. Options are
                            NEAREST, BOX, BILINEAR, HAMMING, BICUBIC, LANCZOS. Default is NEAREST.    
    """
    
    # Open images.
    gradcam = np.load(gradcam_path, allow_pickle=True)
    mask = Image.open(mask_path)
    
    # Resize the derm mask if its size does not match the size of the gradcam image.
    if gradcam.shape != mask.size[::-1]:
        # Note that resize uses (cols, rows) format, while .shape is in (rows, cols) format.
        mask = mask.resize((gradcam.shape[::-1]), interpolation_method)
    
    # Convert the derm mask to numpy format and normalize to [0, 1].
    mask = np.asarray(mask) / 255

    return pixel_metrics_fuzzy(mask, gradcam)


## Per image metrics

In [22]:
def get_per_image_metrics(results_path, model_name, images_path, masks_path, classes, columns):
    gradcams_path = results_path / 'visualisation/gradcam' / model_name
    model_path = results_path / model_name
    
    derm_mask_paths = [mask_path for mask_path in masks_path.iterdir() if mask_path.suffix == '.png']
    image_paths = [image_path for image_path in images_path.rglob('*.jpeg')]

    # For each image in the test set, calculate the value of the defined metrics given the GradCam image for a given
    # class and the outline made by a specific derm for a given characteristic. The result is stored in a defaultdict.
    # As a sanity check, the number of matches between GradCam images and derm annotations is also calculated.
    metrics_list = []

    # Set the method used for interpolation when resizing the derm annotations.
    interpolation = Image.NEAREST

    # Compute metrics for each image
    for image_path in image_paths:
        for diagnosis in classes:
            # Check if matching GradCam file exists.
            gradcam_path = gradcams_path / Path(image_path.stem + '_' + diagnosis + '.npy')
            if gradcam_path.is_file():
                mask_path = masks_path / Path(image_path.stem + '.png') 
                if mask_path.is_file():
                    # Calculate the value of the metics given the GradCam image and the derm mask.
                    gradcam_metric_val = calculate_mask_metrics(gradcam_path, mask_path, interpolation)
                    gradcam_metric_val['gradcam_class'] = diagnosis 
                    gradcam_metric_val['filename'] = image_path.stem 
                    metrics_list.append(gradcam_metric_val)
            else:
                print(f'GradCam file missing for image {image_path}')
                
    return pd.DataFrame.from_records(metrics_list, columns=columns)


In [23]:
def analyse_per_image_gradcam(
    results_path, 
    model_name, 
    images_path, 
    masks_path, 
    preds_name,
    columns,
    classes,
):
    per_image_metrics_df = get_per_image_metrics(results_path, model_name, images_path, masks_path, classes, columns)
    
    preds_df = pd.read_csv(results_path / preds_name)
    preds_df['filename'] = [filename.split('/')[1].split('.')[0] for filename in preds_df.filename.values]
    preds_df = preds_df.merge(per_image_metrics_df, left_on='filename', right_on='filename')
    # Keep only correct predictions
    preds_df = preds_df[preds_df['actual'] == preds_df['pred']]
    preds_df = preds_df[preds_df['pred_class'] == preds_df['gradcam_class']]
    
    return {
        'iou': preds_df['iou'].mean(),
        'dice': preds_df['dice'].mean(),
        'precision': preds_df['precision'].mean(),
        'recall': preds_df['recall'].mean(),
        'negative_predictive_value': preds_df['negative_predictive_value'].mean(),
        'specificity': preds_df['specificity'].mean(), 
    }


In [25]:
model_info = [
    {
        'model_name': 'efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_',
        'model_architecture': 'efficientnet',
    },
    {
        'model_name': 'inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_',
        'model_architecture': 'inception',
    },
    {
        'model_name': 'inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_',
        'model_architecture': 'inceptionresnet',
    },
    {
        'model_name': 'mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_',
        'model_architecture': 'mobilenetv1',
    },
    {
        'model_name': 'mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_',
        'model_architecture': 'mobilenetv2',
    },
    {
        'model_name': 'nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_',
        'model_architecture': 'nasnetmobile',
    },
    {
        'model_name': 'resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_',
        'model_architecture': 'resnet',
    },
    {
        'model_name': 'resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_',
        'model_architecture': 'resnetv2',
    },
    {
        'model_name': 'vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_',
        'model_architecture': 'vgg',
    },
    {
        'model_name': 'xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_', 
        'model_architecture': 'xception',
    }
]

models_performance = []
for model in model_info:
    for idx in range(5):
        model_results_path = results_path / model['model_architecture']
        model_name = f'{model["model_name"]}{idx}'
        preds_name = f'dermx_{idx}_preds.csv'
        print(model_name)
        model_performance = analyse_per_image_gradcam(model_results_path, model_name, images_path, masks_path, preds_name, columns, classes)
        model_performance['model_architecture'] = model['model_architecture']
        model_performance['model_name'] = model['model_name']
        models_performance.append(model_performance)
models_performance_df = pd.DataFrame.from_records(models_performance, columns=models_performance[0].keys())   

efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_0




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_1




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_2




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_3




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_4




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_0




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_1




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_2




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_3




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_4




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_0




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_1




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_2




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_3




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_4




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_0




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_1




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_2




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_3




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_4




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_0




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_1




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_2




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_3




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_4




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_0




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_1




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_2




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_3




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_4




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_0




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_1




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_2




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_3




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_4




resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_0
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_1
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_2




resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_3
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_4
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_0
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_1
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_2




vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_3




vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_4




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_0




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_1




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_2




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_3




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_4




In [29]:
models_performance_df.groupby('model_architecture').describe()

Unnamed: 0_level_0,iou,iou,iou,iou,iou,iou,iou,iou,dice,dice,dice,dice,dice,dice,dice,dice,precision,precision,precision,precision,precision,precision,precision,precision,recall,recall,recall,recall,recall,recall,recall,recall,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,specificity,specificity,specificity,specificity,specificity,specificity,specificity,specificity
Unnamed: 0_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max
model_architecture,Unnamed: 1_level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2,Unnamed: 22_level_2,Unnamed: 23_level_2,Unnamed: 24_level_2,Unnamed: 25_level_2,Unnamed: 26_level_2,Unnamed: 27_level_2,Unnamed: 28_level_2,Unnamed: 29_level_2,Unnamed: 30_level_2,Unnamed: 31_level_2,Unnamed: 32_level_2,Unnamed: 33_level_2,Unnamed: 34_level_2,Unnamed: 35_level_2,Unnamed: 36_level_2,Unnamed: 37_level_2,Unnamed: 38_level_2,Unnamed: 39_level_2,Unnamed: 40_level_2,Unnamed: 41_level_2,Unnamed: 42_level_2,Unnamed: 43_level_2,Unnamed: 44_level_2,Unnamed: 45_level_2,Unnamed: 46_level_2,Unnamed: 47_level_2,Unnamed: 48_level_2
efficientnet,5.0,0.271129,0.007888,0.26179,0.266514,0.2704,0.274468,0.282474,5.0,0.405789,0.010088,0.393204,0.400478,0.406024,0.408946,0.420297,5.0,0.393269,0.009688,0.381409,0.3872,0.392268,0.399748,0.405717,5.0,0.554679,0.013743,0.542057,0.544189,0.549394,0.563638,0.574118,5.0,0.867242,0.005926,0.862651,0.862943,0.866673,0.866687,0.877257,5.0,0.797713,0.007162,0.787529,0.796918,0.796974,0.799593,0.807549
inception,5.0,0.286989,0.003142,0.282876,0.285292,0.286697,0.289334,0.290746,5.0,0.429647,0.002934,0.426046,0.427899,0.429821,0.430654,0.433814,5.0,0.428529,0.00898,0.413634,0.426444,0.433896,0.434073,0.434598,5.0,0.552176,0.009373,0.539631,0.549436,0.552004,0.554117,0.565694,5.0,0.858466,0.0047,0.854257,0.856683,0.857237,0.857612,0.866542,5.0,0.81803,0.005072,0.811113,0.814779,0.819738,0.82056,0.823961
inceptionresnet,5.0,0.23309,0.004154,0.228076,0.231333,0.231344,0.236485,0.238211,5.0,0.361777,0.005437,0.355904,0.358473,0.359446,0.366745,0.368314,5.0,0.418676,0.008283,0.406971,0.414296,0.420061,0.424001,0.428054,5.0,0.421319,0.010544,0.405415,0.418431,0.421312,0.428892,0.432546,5.0,0.845584,0.003606,0.839471,0.846076,0.84664,0.846672,0.849063,5.0,0.866485,0.00465,0.85897,0.865476,0.868195,0.868701,0.871084
mobilenetv1,5.0,0.248339,0.004474,0.243787,0.245216,0.246927,0.251104,0.25466,5.0,0.382329,0.005918,0.376158,0.377497,0.381438,0.386385,0.390165,5.0,0.381843,0.007174,0.374786,0.376579,0.378802,0.388766,0.390281,5.0,0.491009,0.015294,0.474639,0.476108,0.493969,0.500919,0.509411,5.0,0.84427,0.004619,0.838195,0.840415,0.847075,0.847415,0.848248,5.0,0.809452,0.010053,0.79611,0.803428,0.809326,0.819063,0.819331
mobilenetv2,5.0,0.265011,0.012498,0.254713,0.256548,0.262732,0.265028,0.286033,5.0,0.402131,0.015731,0.389625,0.391474,0.399249,0.401506,0.428799,5.0,0.443537,0.019976,0.430108,0.433441,0.433913,0.441783,0.478439,5.0,0.458167,0.013677,0.441388,0.451354,0.458113,0.461603,0.478378,5.0,0.841221,0.004902,0.834892,0.837517,0.842935,0.843831,0.846931,5.0,0.858106,0.006174,0.852924,0.855554,0.856415,0.856823,0.868812
nasnetmobile,5.0,0.298781,0.004685,0.292928,0.297742,0.298184,0.299056,0.305993,5.0,0.44066,0.006486,0.432673,0.439015,0.439395,0.441593,0.450625,5.0,0.417228,0.009942,0.405413,0.408077,0.420157,0.425618,0.426875,5.0,0.60595,0.004837,0.600031,0.603158,0.604791,0.610274,0.611493,5.0,0.876292,0.004403,0.872189,0.873298,0.873914,0.880246,0.881811,5.0,0.803159,0.005238,0.796839,0.798919,0.804616,0.805673,0.809747
resnet,5.0,0.193838,0.017544,0.179002,0.180388,0.183897,0.212342,0.21356,5.0,0.303606,0.02364,0.282943,0.286064,0.290436,0.327363,0.331224,5.0,0.348565,0.009366,0.337207,0.342735,0.347249,0.355078,0.360556,5.0,0.373724,0.064427,0.304621,0.319836,0.365995,0.426418,0.451748,5.0,0.836658,0.007693,0.829035,0.831641,0.832717,0.844486,0.845411,5.0,0.839295,0.026799,0.808858,0.821387,0.833353,0.858791,0.874084
resnetv2,5.0,0.264114,0.005328,0.257162,0.261158,0.263866,0.267632,0.270751,5.0,0.404987,0.006501,0.396921,0.40061,0.404829,0.409638,0.412935,5.0,0.505571,0.007547,0.494863,0.500518,0.509497,0.510438,0.512537,5.0,0.417159,0.005567,0.411956,0.413348,0.414161,0.422389,0.423943,5.0,0.843555,0.003993,0.83878,0.839851,0.845506,0.845784,0.847854,5.0,0.909117,0.002574,0.905742,0.907224,0.909756,0.910984,0.911879
vgg,5.0,0.201695,0.038193,0.150934,0.177983,0.20291,0.236008,0.240643,5.0,0.321106,0.05187,0.251019,0.289337,0.324886,0.367231,0.373055,5.0,0.465579,0.02063,0.450675,0.45088,0.459825,0.465852,0.500664,5.0,0.296954,0.078859,0.194953,0.244777,0.297882,0.372025,0.375134,5.0,0.824502,0.014583,0.803059,0.817391,0.827661,0.835224,0.839175,5.0,0.922428,0.025428,0.896627,0.900635,0.91989,0.937942,0.957048
xception,5.0,0.298148,0.005708,0.291791,0.292621,0.300193,0.301225,0.304908,5.0,0.442962,0.00692,0.435429,0.435994,0.445625,0.446744,0.451016,5.0,0.487938,0.007308,0.477525,0.484077,0.49025,0.491327,0.496509,5.0,0.50685,0.01441,0.493753,0.500676,0.501561,0.507056,0.531202,5.0,0.85456,0.006534,0.847916,0.850218,0.854232,0.855543,0.86489,5.0,0.871332,0.001892,0.868596,0.870648,0.871202,0.872936,0.873276


## Per characteristic metrics

In [47]:
def get_per_characteristic_metrics(results_path, model_name, images_path, masks_path, classes, columns, characteristics):
    gradcams_path = results_path / 'visualisation/gradcam' / model_name
    model_path = results_path / model_name
    
    derm_mask_paths = [mask_path for mask_path in masks_path.iterdir() if mask_path.suffix == '.png']
    image_paths = [image_path for image_path in images_path.rglob('*.jpeg')]

    # For each image in the test set, calculate the value of the defined metrics given the GradCam image for a given
    # class and the outline made by a specific derm for a given characteristic. The result is stored in a defaultdict.
    # As a sanity check, the number of matches between GradCam images and derm annotations is also calculated.
    metrics_list = []

    # Set the method used for interpolation when resizing the derm annotations.
    interpolation = Image.NEAREST

    # Compute metrics for each image
    for image_path in image_paths:
        for characteristic in characteristics:
            for diagnosis in classes:
                # Check if matching GradCam file exists.
                gradcam_path = gradcams_path / Path(image_path.stem + '_' + diagnosis + '.npy')
                if gradcam_path.is_file():
                    mask_path = masks_path / Path(f'{characteristic}_{image_path.stem}.png') 
                    if mask_path.is_file():
                        # Calculate the value of the metics given the GradCam image and the derm mask.
                        gradcam_metric_val = calculate_mask_metrics(gradcam_path, mask_path, interpolation)
                        gradcam_metric_val['gradcam_class'] = diagnosis 
                        gradcam_metric_val['characteristic'] = characteristic 
                        gradcam_metric_val['filename'] = image_path.stem 
                        metrics_list.append(gradcam_metric_val)
                else:
                    print(f'GradCam file missing for image {image_path}')
                
    return pd.DataFrame.from_records(metrics_list, columns=columns)


In [96]:
def analyse_per_characteristics_gradcam(
    results_path, 
    model_name, 
    images_path, 
    masks_path, 
    preds_name,
    columns,
    classes,
    characteristics,
    metrics
):
    per_image_metrics_df = get_per_characteristic_metrics(results_path, model_name, images_path, masks_path, classes, columns, characteristics)
    preds_df = pd.read_csv(results_path / preds_name)
    preds_df['filename'] = [filename.split('/')[1].split('.')[0] for filename in preds_df.filename.values]
    preds_df = preds_df.merge(per_image_metrics_df, left_on='filename', right_on='filename')
    # Keep only correct predictions
    preds_df = preds_df[preds_df['actual'] == preds_df['pred']]
    preds_df = preds_df[preds_df['pred_class'] == preds_df['gradcam_class']]

    metrics_dict = {}
    for characteristic in characteristics:
        metrics_dict[characteristic] = {}
        for metric in metrics:
            metrics_dict[characteristic][metric] = preds_df[preds_df['characteristic'] == characteristic][metric].mean()
            
    return metrics_dict


In [120]:
model_info = [
    {
        'model_name': 'efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_',
        'model_architecture': 'efficientnet',
    },
    {
        'model_name': 'inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_',
        'model_architecture': 'inception',
    },
    {
        'model_name': 'inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_',
        'model_architecture': 'inceptionresnet',
    },
    {
        'model_name': 'mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_',
        'model_architecture': 'mobilenetv1',
    },
    {
        'model_name': 'mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_',
        'model_architecture': 'mobilenetv2',
    },
    {
        'model_name': 'nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_',
        'model_architecture': 'nasnetmobile',
    },
    {
        'model_name': 'resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_',
        'model_architecture': 'resnet',
    },
    {
        'model_name': 'resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_',
        'model_architecture': 'resnetv2',
    },
    {
        'model_name': 'vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_',
        'model_architecture': 'vgg',
    },
    {
        'model_name': 'xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_', 
        'model_architecture': 'xception',
    }
]
masks_path = Path('/home/ubuntu/hot-store/dermx_masks/per_characteristic')
columns = [
    'filename',
    'gradcam_class',
    'characteristic',
    'iou',
    'dice',
    'precision',
    'recall',
    'negative_predictive_value',
    'specificity'
]
metrics = [
    'iou',
    'dice',
    'precision',
    'recall',
    'negative_predictive_value',
    'specificity'
]

models_performance_dict = {}
for model in model_info:
    for idx in range(5):
        model_results_path = results_path / model['model_architecture']
        model_name = f'{model["model_name"]}{idx}'
        preds_name = f'dermx_{idx}_preds.csv'
        print(model_name)
        model_performance = analyse_per_characteristics_gradcam(model_results_path, model_name, images_path, masks_path, preds_name, columns, classes, characteristics, metrics)
        for k, v in model_performance.items():
            models_performance_dict[(model['model_architecture'], model_name, k)] = v

models_performance_df = pd.DataFrame(models_performance_dict).T

efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_0




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_1




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_2




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_3




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_4




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_0




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_1




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_2




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_3




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_4




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_0




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_1




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_2




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_3




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_4




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_0




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_1




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_2




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_3




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_4




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_0




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_1




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_2




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_3




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_4




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_0




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_1




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_2




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_3




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_4




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_0




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_1




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_2




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_3




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_4




resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_0
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_1
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_2




resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_3
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_4
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_0
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_1
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_2




vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_3




vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_4




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_0




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_1




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_2




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_3




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_4




In [123]:
models_performance_df.reset_index().groupby(['level_0', 'level_2']).describe()

Unnamed: 0_level_0,Unnamed: 1_level_0,iou,iou,iou,iou,iou,iou,iou,iou,dice,dice,dice,dice,dice,dice,dice,dice,precision,precision,precision,precision,precision,precision,precision,precision,recall,recall,recall,recall,recall,recall,recall,recall,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,specificity,specificity,specificity,specificity,specificity,specificity,specificity,specificity
Unnamed: 0_level_1,Unnamed: 1_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max
level_0,level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2,Unnamed: 22_level_2,Unnamed: 23_level_2,Unnamed: 24_level_2,Unnamed: 25_level_2,Unnamed: 26_level_2,Unnamed: 27_level_2,Unnamed: 28_level_2,Unnamed: 29_level_2,Unnamed: 30_level_2,Unnamed: 31_level_2,Unnamed: 32_level_2,Unnamed: 33_level_2,Unnamed: 34_level_2,Unnamed: 35_level_2,Unnamed: 36_level_2,Unnamed: 37_level_2,Unnamed: 38_level_2,Unnamed: 39_level_2,Unnamed: 40_level_2,Unnamed: 41_level_2,Unnamed: 42_level_2,Unnamed: 43_level_2,Unnamed: 44_level_2,Unnamed: 45_level_2,Unnamed: 46_level_2,Unnamed: 47_level_2,Unnamed: 48_level_2,Unnamed: 49_level_2
efficientnet,Closed comedo,5.0,0.131268,0.007443,0.123977,0.126396,0.12735,0.139236,0.139381,5.0,0.197302,0.009332,0.187647,0.191805,0.192412,0.207047,0.2076,5.0,0.176232,0.00832,0.167476,0.169139,0.175081,0.183308,0.186158,5.0,0.534995,0.017231,0.512496,0.52744,0.530334,0.552139,0.552565,5.0,0.955275,0.002181,0.951521,0.955714,0.955955,0.955956,0.957227,5.0,0.751385,0.013026,0.735161,0.746358,0.749553,0.755164,0.770689
efficientnet,Cyst,5.0,0.020709,0.002862,0.017472,0.018319,0.021038,0.022252,0.024463,5.0,0.039189,0.005294,0.03329,0.034804,0.039673,0.041874,0.046305,5.0,0.022058,0.003384,0.018258,0.019171,0.022654,0.023663,0.026542,5.0,0.41794,0.036681,0.364049,0.405244,0.416502,0.451373,0.452532,5.0,0.992149,0.000304,0.991881,0.99195,0.992072,0.99219,0.992651,5.0,0.739559,0.013552,0.721712,0.735265,0.737313,0.744849,0.758656
efficientnet,Dermatoglyph disruption,0.0,,,,,,,,0.0,,,,,,,,0.0,,,,,,,,0.0,,,,,,,,0.0,,,,,,,,0.0,,,,,,,
efficientnet,Leukotrichia,5.0,0.084602,0.012101,0.069894,0.074229,0.089178,0.090935,0.098772,5.0,0.152961,0.022027,0.125308,0.135272,0.161315,0.164061,0.178847,5.0,0.185899,0.061132,0.103795,0.16704,0.179265,0.207921,0.271472,5.0,0.306961,0.055604,0.259863,0.286258,0.289224,0.29612,0.403337,5.0,0.836446,0.058589,0.806351,0.807145,0.811622,0.816089,0.941021,5.0,0.79447,0.043075,0.738302,0.762098,0.80637,0.824405,0.841174
efficientnet,Macule,5.0,0.123511,0.009233,0.110574,0.121344,0.122987,0.126504,0.136148,5.0,0.194876,0.013101,0.177714,0.191193,0.192923,0.198703,0.213849,5.0,0.220208,0.019184,0.196052,0.213589,0.216734,0.226235,0.248427,5.0,0.409264,0.02155,0.379299,0.402314,0.404135,0.429466,0.431105,5.0,0.872179,0.014491,0.859006,0.86531,0.869093,0.870663,0.896824,5.0,0.760656,0.013733,0.747031,0.754949,0.757814,0.759862,0.783622
efficientnet,Nodule,5.0,0.03667,0.00355,0.032114,0.034941,0.037198,0.037331,0.041765,5.0,0.06292,0.006326,0.055142,0.06002,0.062873,0.064179,0.072384,5.0,0.044945,0.004323,0.038896,0.043481,0.045721,0.045791,0.050837,5.0,0.43913,0.015278,0.421402,0.430393,0.436381,0.446362,0.461112,5.0,0.980085,0.000699,0.979364,0.979405,0.980092,0.980762,0.980802,5.0,0.735823,0.015352,0.717573,0.730667,0.731052,0.740873,0.75895
efficientnet,Open comedo,5.0,0.123508,0.003335,0.118555,0.121628,0.125128,0.125781,0.126446,5.0,0.189092,0.00311,0.184456,0.187299,0.190884,0.191353,0.191469,5.0,0.173074,0.005149,0.164928,0.173348,0.173488,0.174391,0.179215,5.0,0.494639,0.010895,0.477061,0.492601,0.498191,0.499506,0.505837,5.0,0.944388,0.002557,0.942061,0.942111,0.943544,0.947074,0.947149,5.0,0.760735,0.013714,0.742818,0.758526,0.758934,0.762142,0.781256
efficientnet,Papule,5.0,0.1007,0.006568,0.092858,0.095145,0.101529,0.106484,0.107486,5.0,0.156429,0.009693,0.145678,0.147218,0.157951,0.164413,0.166886,5.0,0.127023,0.011125,0.114295,0.11623,0.130714,0.135148,0.138726,5.0,0.589126,0.022561,0.557815,0.579244,0.58787,0.605082,0.615617,5.0,0.966005,0.004443,0.962334,0.962857,0.963566,0.968794,0.972474,5.0,0.735609,0.007013,0.726716,0.731954,0.734788,0.739626,0.744961
efficientnet,Patch,5.0,0.140935,0.005029,0.134103,0.139104,0.139806,0.144845,0.146816,5.0,0.228923,0.007682,0.217918,0.226872,0.227286,0.236092,0.23645,5.0,0.219745,0.013299,0.20144,0.212394,0.220593,0.229915,0.234382,5.0,0.365316,0.017929,0.342495,0.357913,0.363539,0.371445,0.39119,5.0,0.887977,0.009308,0.873872,0.883971,0.891648,0.892565,0.897829,5.0,0.778051,0.010052,0.765241,0.774287,0.777877,0.779881,0.792968
efficientnet,Plaque,5.0,0.202421,0.004258,0.197724,0.200845,0.201229,0.203096,0.209212,5.0,0.318556,0.004735,0.313037,0.315896,0.317888,0.320475,0.325487,5.0,0.325089,0.003582,0.321226,0.321448,0.326533,0.326955,0.329283,5.0,0.439018,0.014139,0.425091,0.429667,0.436517,0.442432,0.461385,5.0,0.828322,0.008812,0.823194,0.823209,0.824465,0.826887,0.843854,5.0,0.769597,0.008573,0.757784,0.768551,0.769758,0.769919,0.781974


## Per derm

In [139]:
def get_per_derm_metrics(results_path, model_name, images_path, masks_path, classes, columns, derms):
    gradcams_path = results_path / 'visualisation/gradcam' / model_name
    model_path = results_path / model_name
    
    derm_mask_paths = [mask_path for mask_path in masks_path.iterdir() if mask_path.suffix == '.png']
    image_paths = [image_path for image_path in images_path.rglob('*.jpeg')]

    # For each image in the test set, calculate the value of the defined metrics given the GradCam image for a given
    # class and the outline made by a specific derm for a given characteristic. The result is stored in a defaultdict.
    # As a sanity check, the number of matches between GradCam images and derm annotations is also calculated.
    metrics_list = []

    # Set the method used for interpolation when resizing the derm annotations.
    interpolation = Image.NEAREST

    # Compute metrics for each image
    for image_path in image_paths:
        for derm in derms:
            for diagnosis in classes:
                # Check if matching GradCam file exists.
                gradcam_path = gradcams_path / Path(image_path.stem + '_' + diagnosis + '.npy')
                if gradcam_path.is_file():
                    mask_path = masks_path / Path(f'{derm}_{image_path.stem}.png') 
                    if mask_path.is_file():
                        # Calculate the value of the metics given the GradCam image and the derm mask.
                        gradcam_metric_val = calculate_mask_metrics(gradcam_path, mask_path, interpolation)
                        gradcam_metric_val['gradcam_class'] = diagnosis 
                        gradcam_metric_val['derm'] = derm
                        gradcam_metric_val['filename'] = image_path.stem 
                        metrics_list.append(gradcam_metric_val)
                else:
                    print(f'GradCam file missing for image {image_path}')
                
    return pd.DataFrame.from_records(metrics_list, columns=columns)


In [143]:
def analyse_per_derms_gradcam(
    results_path, 
    model_name, 
    images_path, 
    masks_path, 
    preds_name,
    columns,
    classes,
    derms,
    metrics
):
    per_image_metrics_df = get_per_derm_metrics(results_path, model_name, images_path, masks_path, classes, columns, derms)
    preds_df = pd.read_csv(results_path / preds_name)
    preds_df['filename'] = [filename.split('/')[1].split('.')[0] for filename in preds_df.filename.values]
    preds_df = preds_df.merge(per_image_metrics_df, left_on='filename', right_on='filename')
    # Keep only correct predictions
    preds_df = preds_df[preds_df['actual'] == preds_df['pred']]
    preds_df = preds_df[preds_df['pred_class'] == preds_df['gradcam_class']]
    metrics_dict = {}
    for derm in derms:
        metrics_dict[derm] = {}
        for metric in metrics:
            metrics_dict[derm][metric] = preds_df[preds_df['derm'] == derm][metric].mean()
            
    return metrics_dict


In [146]:
model_info = [
    {
        'model_name': 'efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_',
        'model_architecture': 'efficientnet',
    },
    {
        'model_name': 'inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_',
        'model_architecture': 'inception',
    },
    {
        'model_name': 'inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_',
        'model_architecture': 'inceptionresnet',
    },
    {
        'model_name': 'mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_',
        'model_architecture': 'mobilenetv1',
    },
    {
        'model_name': 'mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_',
        'model_architecture': 'mobilenetv2',
    },
    {
        'model_name': 'nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_',
        'model_architecture': 'nasnetmobile',
    },
    {
        'model_name': 'resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_',
        'model_architecture': 'resnet',
    },
    {
        'model_name': 'resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_',
        'model_architecture': 'resnetv2',
    },
    {
        'model_name': 'vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_',
        'model_architecture': 'vgg',
    },
    {
        'model_name': 'xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_', 
        'model_architecture': 'xception',
    }
]
masks_path = Path('/home/ubuntu/hot-store/dermx_masks/per_derm')
columns = [
    'filename',
    'gradcam_class',
    'derm',
    'iou',
    'dice',
    'precision',
    'recall',
    'negative_predictive_value',
    'specificity'
]
metrics = [
    'iou',
    'dice',
    'precision',
    'recall',
    'negative_predictive_value',
    'specificity'
]

models_performance_dict = {}
for model in model_info:
    for idx in range(5):
        model_results_path = results_path / model['model_architecture']
        model_name = f'{model["model_name"]}{idx}'
        preds_name = f'dermx_{idx}_preds.csv'
        print(model_name)
        model_performance = analyse_per_derms_gradcam(model_results_path, model_name, images_path, masks_path, preds_name, columns, classes, derms, metrics)

        for k, v in model_performance.items():
            models_performance_dict[(model['model_architecture'], model_name, k)] = v

models_performance_df = pd.DataFrame(models_performance_dict).T

efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_0




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_1




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_2




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_3




efficientnetb0_r20_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock6d_add_4




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_0




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_1




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_2




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_3




inception_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.001_lactivation_85_4




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_0




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_1




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_2




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_3




inceptionresnetv2_r20_s0.25_z0.5_b[0.75, 1.25]_lr0.0001_lblock8_9_ac_4




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_0




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_1




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_2




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_3




mobilenetv1_r10_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv_pw_12_relu_4




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_0




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_1




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_2




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_3




mobilenetv2_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.0001_lblock_15_add_4




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_0




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_1




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_2




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_3




nasnetmobile_r20_s0.25_z0.5_b[0.5, 1.0]_lr0.0001_lnormal_concat_11_4




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_0




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_1




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_2




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_3




resnet50_r20_s0.5_z0.5_b[0.5, 1.5]_lr0.0001_lconv5_block3_out_4




resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_0
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_1
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_2




resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_3
resnetv2_r20_s0.25_z0.25_b[0.5, 1.0]_lr0.001_lpost_relu_4
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_0
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_1
vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_2




vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_3




vgg_r10_s0.0_z0.25_b[0.5, 1.0]_lr0.01_lblock5_pool_4




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_0




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_1




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_2




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_3




xception_r10_s0.25_z0.5_b[0.5, 1.5]_lr0.001_lblock14_sepconv2_act_4




In [151]:
models_performance_df.reset_index().groupby(['level_0', 'level_2']).describe()

Unnamed: 0_level_0,Unnamed: 1_level_0,iou,iou,iou,iou,iou,iou,iou,iou,dice,dice,dice,dice,dice,dice,dice,dice,precision,precision,precision,precision,precision,precision,precision,precision,recall,recall,recall,recall,recall,recall,recall,recall,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,negative_predictive_value,specificity,specificity,specificity,specificity,specificity,specificity,specificity,specificity
Unnamed: 0_level_1,Unnamed: 1_level_1,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max,count,mean,std,min,25%,50%,75%,max
level_0,level_2,Unnamed: 2_level_2,Unnamed: 3_level_2,Unnamed: 4_level_2,Unnamed: 5_level_2,Unnamed: 6_level_2,Unnamed: 7_level_2,Unnamed: 8_level_2,Unnamed: 9_level_2,Unnamed: 10_level_2,Unnamed: 11_level_2,Unnamed: 12_level_2,Unnamed: 13_level_2,Unnamed: 14_level_2,Unnamed: 15_level_2,Unnamed: 16_level_2,Unnamed: 17_level_2,Unnamed: 18_level_2,Unnamed: 19_level_2,Unnamed: 20_level_2,Unnamed: 21_level_2,Unnamed: 22_level_2,Unnamed: 23_level_2,Unnamed: 24_level_2,Unnamed: 25_level_2,Unnamed: 26_level_2,Unnamed: 27_level_2,Unnamed: 28_level_2,Unnamed: 29_level_2,Unnamed: 30_level_2,Unnamed: 31_level_2,Unnamed: 32_level_2,Unnamed: 33_level_2,Unnamed: 34_level_2,Unnamed: 35_level_2,Unnamed: 36_level_2,Unnamed: 37_level_2,Unnamed: 38_level_2,Unnamed: 39_level_2,Unnamed: 40_level_2,Unnamed: 41_level_2,Unnamed: 42_level_2,Unnamed: 43_level_2,Unnamed: 44_level_2,Unnamed: 45_level_2,Unnamed: 46_level_2,Unnamed: 47_level_2,Unnamed: 48_level_2,Unnamed: 49_level_2
efficientnet,derm1,5.0,0.180183,0.008962,0.172147,0.174024,0.176063,0.185213,0.193467,5.0,0.283701,0.012872,0.273929,0.274954,0.276195,0.289797,0.303631,5.0,0.261647,0.014891,0.24159,0.250661,0.266877,0.273231,0.275875,5.0,0.491409,0.018749,0.465269,0.484611,0.489628,0.502821,0.514714,5.0,0.893486,0.006547,0.886434,0.888147,0.892456,0.899179,0.901215,5.0,0.775859,0.010792,0.764644,0.76636,0.774352,0.786376,0.787561
efficientnet,derm2,5.0,0.206976,0.006639,0.199934,0.203,0.20682,0.207643,0.217484,5.0,0.321327,0.009539,0.311906,0.313539,0.322278,0.32307,0.33584,5.0,0.314412,0.007838,0.305205,0.310097,0.311573,0.322128,0.323056,5.0,0.514495,0.009844,0.506041,0.506102,0.510106,0.524425,0.525802,5.0,0.859989,0.005985,0.854507,0.855267,0.857352,0.865535,0.867284,5.0,0.768529,0.008605,0.759394,0.765314,0.767509,0.767733,0.782697
efficientnet,derm3,5.0,0.220569,0.014794,0.20339,0.213382,0.216292,0.227813,0.241969,5.0,0.34234,0.019691,0.317858,0.334212,0.33673,0.353585,0.369314,5.0,0.331013,0.012562,0.316156,0.326222,0.329904,0.332151,0.350634,5.0,0.483902,0.029493,0.444338,0.474015,0.475869,0.505586,0.519701,5.0,0.848969,0.009246,0.839597,0.845687,0.845811,0.849513,0.864236,5.0,0.770981,0.008208,0.757646,0.770152,0.771696,0.777687,0.777726
efficientnet,derm4,5.0,0.223289,0.008617,0.215216,0.217499,0.21845,0.23263,0.232649,5.0,0.339788,0.010252,0.330157,0.332762,0.334216,0.350581,0.351222,5.0,0.359607,0.015205,0.339321,0.348228,0.364418,0.372885,0.373184,5.0,0.450145,0.009504,0.436871,0.447963,0.448589,0.454571,0.462729,5.0,0.829947,0.006811,0.821459,0.82846,0.829221,0.830123,0.84047,5.0,0.786308,0.008788,0.775485,0.77956,0.787862,0.791531,0.797104
efficientnet,derm5,5.0,0.21633,0.004655,0.210022,0.212934,0.218063,0.219776,0.220854,5.0,0.333527,0.006138,0.324659,0.330138,0.33623,0.336347,0.34026,5.0,0.337075,0.006414,0.326631,0.336732,0.338691,0.339344,0.343976,5.0,0.468853,0.009907,0.457341,0.463626,0.464932,0.477763,0.480601,5.0,0.834181,0.010787,0.825472,0.828804,0.829655,0.834348,0.852625,5.0,0.774513,0.006488,0.768038,0.769741,0.77372,0.776624,0.784442
efficientnet,derm6,5.0,0.205423,0.005173,0.197133,0.20418,0.207144,0.208051,0.210608,5.0,0.323758,0.006545,0.313732,0.321402,0.325944,0.326795,0.330918,5.0,0.307446,0.008887,0.29774,0.299556,0.307967,0.313386,0.318578,5.0,0.498855,0.007951,0.489835,0.490594,0.503343,0.504439,0.506064,5.0,0.85705,0.004199,0.853691,0.853951,0.855263,0.858675,0.863669,5.0,0.760029,0.004251,0.752805,0.759929,0.761353,0.762617,0.763439
efficientnet,derm7,5.0,0.165199,0.005951,0.158387,0.159348,0.167914,0.168732,0.171615,5.0,0.263995,0.007761,0.254926,0.256804,0.267318,0.267992,0.272937,5.0,0.226725,0.011196,0.215849,0.21842,0.224214,0.23155,0.243594,5.0,0.507295,0.009602,0.499819,0.500506,0.504023,0.508911,0.523217,5.0,0.916709,0.006781,0.906311,0.91523,0.916475,0.922383,0.923144,5.0,0.772118,0.008006,0.761382,0.766533,0.773935,0.778532,0.780209
efficientnet,derm8,5.0,0.261083,0.004252,0.255101,0.258517,0.262419,0.263649,0.26573,5.0,0.390028,0.004999,0.38268,0.387493,0.391321,0.393625,0.395022,5.0,0.416969,0.007763,0.408285,0.411995,0.417312,0.418524,0.428731,5.0,0.490869,0.010321,0.481267,0.48378,0.489906,0.491734,0.50766,5.0,0.820387,0.005919,0.815876,0.817009,0.818582,0.819845,0.830625,5.0,0.79848,0.005738,0.791647,0.79655,0.797601,0.799178,0.807427
inception,derm1,5.0,0.186577,0.00404,0.18082,0.18509,0.186111,0.190373,0.190491,5.0,0.296987,0.004996,0.290232,0.293802,0.297649,0.301078,0.302174,5.0,0.266481,0.004841,0.262848,0.263407,0.264801,0.266609,0.274742,5.0,0.5013,0.012047,0.485838,0.493344,0.503055,0.507634,0.516628,5.0,0.891503,0.003088,0.886995,0.889684,0.892752,0.893889,0.894198,5.0,0.766621,0.004733,0.75874,0.766199,0.768195,0.768938,0.771034
inception,derm2,5.0,0.217086,0.00525,0.210214,0.213385,0.21849,0.220036,0.223302,5.0,0.337102,0.006904,0.327339,0.332732,0.3404,0.340691,0.344348,5.0,0.341967,0.005478,0.335629,0.339512,0.341702,0.342447,0.350543,5.0,0.503252,0.017795,0.485591,0.489298,0.497218,0.51936,0.524795,5.0,0.848553,0.00458,0.844827,0.845534,0.845777,0.851326,0.8553,5.0,0.791231,0.00555,0.78538,0.78792,0.788516,0.796987,0.797354


### Old

In [2]:
# Set paths

# Path to the GradCam images.
gradcam_main_path = Path('/home/ubuntu/store/efficientnet-final-size/visualisation/gradcam/')

# Set path to the model used to create the visualisations.
model_path = Path('efficientnetb4_0')

# Path to the masks create by the derms for the individual characteristics.
derm_mask_main_path = Path('/home/ubuntu/store/masks/masks_resized')

# Path to the rescaled test images.
test_im_path = Path('/home/ubuntu/store/DermX-test-set/test/')


In [3]:
full_gradcam_path = gradcam_main_path / model_path
full_lime_path = lime_main_path / model_path

In [4]:
classes = [
    "Acne",
    "Actinic keratosis",
    "Psoriasis",
    "Seborrheic dermatitis",
    "Viral warts",
    "Vitiligo"
]

derms = [
    'derm0',
    'derm1',
    'derm2',
    'derm3',
    'derm4',
    'derm5',
    'derm6',
    'derm7',
]

chars = [
    'closed-comedo',
    'cyst',
    'dermatoglyph-disruption',
    'leukotrichia',
    'macule',
    'nodule',
    'open-comedo',
    'papule',
    'patch',
    'plaque',
    'pustule',
    'scale',
    'scar',
    'sun-damage',
    'telangiectasia',
    'thrombosed-capillaries'
]


In [5]:
# Extract the paths to the derm masks. The resulting list is only used for a sanity check.
derm_mask_paths = [p for p in derm_mask_main_path.iterdir() if p.suffix == '.png']
derm_mask_paths[0:5]

[PosixPath('/home/ubuntu/store/masks/masks_spinaltap/043023HB_mihaela_2021-05-27-masks_plaque.png'),
 PosixPath('/home/ubuntu/store/masks/masks_spinaltap/043212HB_adelina_2021-05-27-masks_scale.png'),
 PosixPath('/home/ubuntu/store/masks/masks_spinaltap/043269HB_adelina_2021-05-27-masks_papule.png'),
 PosixPath('/home/ubuntu/store/masks/masks_spinaltap/293--WatermarkedWyJXYXRlcm1hcmtlZCJd_mihaela_2021-05-27-masks_scale.png'),
 PosixPath('/home/ubuntu/store/masks/masks_spinaltap/viral-wart-08--WatermarkedWyJXYXRlcm1hcmtlZCJd_oana_2021-05-27-masks_papule.png')]

In [6]:
# Extract the paths to the test images. Only needed for visualization and debugging.
test_img_paths = [p for p in Path(test_im_path).rglob('*.jpeg')]
test_img_paths[0:5]

[PosixPath('/home/ubuntu/store/DermX-test-set/test/Actinic keratosis/017359HB.jpeg'),
 PosixPath('/home/ubuntu/store/DermX-test-set/test/Actinic keratosis/476--WatermarkedWyJXYXRlcm1hcmtlZCJd.jpeg'),
 PosixPath('/home/ubuntu/store/DermX-test-set/test/Actinic keratosis/469--WatermarkedWyJXYXRlcm1hcmtlZCJd.jpeg'),
 PosixPath('/home/ubuntu/store/DermX-test-set/test/Actinic keratosis/3742--WatermarkedWyJXYXRlcm1hcmtlZCJd.jpeg'),
 PosixPath('/home/ubuntu/store/DermX-test-set/test/Actinic keratosis/3753--WatermarkedWyJXYXRlcm1hcmtlZCJd.jpeg')]

In [7]:
# Metrics supporting probabilistic segmentation maps
fuzzy_and = lambda x,y: np.minimum(x,y)
fuzzy_or = lambda x,y: np.maximum(x,y)
fuzzy_not = lambda x: 1-x

def pixel_metrics_fuzzy(y_true, y_pred):
    """
    Pixel-level metrics of segmentation accuracy following fuzzy logic operators.
    
    :param y_true: numpy.ndarray of reference segmentation, values in [0,1]
    :param y_pred: numpy.ndarray of predicted segmentation, values in [0,1]

    :return: a dictionary encoding the metrics
    """
        
    np.testing.assert_equal(y_true.shape, y_pred.shape, err_msg="Expecting \
    the reference and predicted segmentations to be of the same size.")
    
    # Check the ranges
    np.testing.assert_equal(np.logical_and(y_true >= 0, y_true <= 1).all(), True, err_msg="Expecting \
    the reference segmentations to be in the range 0 to 1.")
    np.testing.assert_equal(np.logical_and(y_pred >= 0, y_pred <= 1).all(), True, err_msg="Expecting \
    the predicted segmentations to be in the range 0 to 1.")
    
    TP = fuzzy_and(y_true, y_pred).sum()
    TN = fuzzy_and(fuzzy_not(y_true), fuzzy_not(y_pred)).sum()
    union = fuzzy_or(y_true, y_pred).sum()
    
    metrics = {}
    
    # Summary metrics
    metrics["iou"] = TP / union
    metrics["dice"] = 2 * TP / ( y_true.sum() + y_pred.sum() ) 
    
    # Positive class metrics
    metrics["precision"] = TP / y_pred.sum()
    metrics["recall"] = TP / y_true.sum()
    
    # Negative class metrics
    metrics["negative_predictive_value"] = TN / fuzzy_not(y_pred).sum()
    metrics["specificity"] = TN / fuzzy_not(y_true).sum()
    
    return metrics

In [8]:
def calc_res(gradcam_image_path, derm_char_mask_path, interpolation_method=Image.NEAREST):
    """
    Calculates the fuzzy logic metrics given the paths to a pair of input images.
    The derm mask is resized to match the size of the gradcam image.
    
    Input:
    - gradcam_image_path: Pathlib path to a gradCam image. The file is assumed to be in .npy format.
    - derm_char_mask_path: Pathlib path to a derm annotation. The file is assumed to be in a format that can
                           be opened by PIL.
    - interpolation_method: String. The method used for interpolation when resizing the derm mask. Options are
                            NEAREST, BOX, BILINEAR, HAMMING, BICUBIC, LANCZOS. Default is NEAREST.    
    """
    
    # Open images.
    gradcam_im = np.load(gradcam_image_path, allow_pickle=True)
    mask_im = Image.open(derm_char_mask_path)
    
    # Resize the derm mask if its size does not match the size of the gradcam image.
    if gradcam_im.shape != mask_im.size[::-1]:
        # Note that resize uses (cols, rows) format, while .shape is in (rows, cols) format.
        mask_im = mask_im.resize((gradcam_im.shape[::-1]), interpolation_method)
    
    # Corvert the derm mask to numpy format and normalize to [0, 1].
    mask_im = np.asarray(mask_im) / 255
  
    res = pixel_metrics_fuzzy(mask_im, gradcam_im)
    return res

In [9]:
# For each image in the test set, calculate the value of the defined metrics given the GradCam image for a given
# class and the outline made by a specific derm for a given characteristic. The result is stored in a defaultdict.
# As a sanity check, the number of matches between GradCam images and derm annotations is also calculated.
rec_dd = lambda: defaultdict(rec_dd)
out_gradcam = rec_dd()
hit_counter = 0

# Set the method used for interpolation when resizing the derm annotations.
interpolation = Image.NEAREST

for p in test_img_paths:
    for c in classes:
        # Check if matching GradCam file exists.
        gc_path = full_gradcam_path / Path(p.stem + '_' + c + '.npy')
        if gc_path.is_file():
            for d in derms:
                for ch in chars:
                    # Check if this derm has created a mask for this characteristic.
                    mask_path = derm_mask_main_path / Path(p.stem + '_' + d + '_2021-05-27-masks_' + ch + '.png') 
                    if mask_path.is_file():
                        # Calculate the value of the metics given the GradCam image and the derm mask.
                        gradcam_metric_val = calc_res(gc_path, mask_path, interpolation)
                        out_gradcam[p.stem][c][d][ch] = gradcam_metric_val
                        hit_counter += 1
        else:
            print('GradCam or LIME file missing for image: ', p)

print(hit_counter)



19578


In [12]:
# We expect that the value of the hit counter should be equal to the number of derm masks multiplied with the number
# of classes.
if len(derm_mask_paths)*6 != hit_counter:
    print('Oh no, some files were not found. Expected/found: ', len(derm_mask_paths)*6, hit_counter)
else:
    print('GradCam images found for all derm annotations.')


GradCam images found for all derm annotations.


In [13]:
def transform_to_list(nested_dict):
    # Transform the gradcam defaultdict to a list of tuples.
    
    out = []
    for im_name, class_dict in nested_dict.items():
        for class_name, derm_dict in class_dict.items():
            for derm_name, char_dict in derm_dict.items():
                for char_name, metric
                _dict in char_dict.items():
                    tmp = tuple(metric_dict.values())
                    out.append( (im_name, class_name, derm_name, char_name) + tmp )
    return out

In [14]:
gradcam_res_list = transform_to_list(out_gradcam)
len(gradcam_res_list)

19578

## Make output dataFrames/csv files

In [18]:
col_names = ['image_name',
             'visualisation_class',
             'derm',
             'characteristic',
             'iou',
             'dice',
             'precision',
             'recall',
             'negative_predictive_value',
             'specificity'
            ]

In [None]:
gradcam_df = pd.DataFrame.from_records(gradcam_res_list, columns=col_names)
gradcam_df

In [22]:
# Save dataFrames
model_name = str(model_path)
gradcam_df.to_csv(model_name + "_gradcam_scores.csv")


# Filter

In [123]:
import glob
model_names = glob.glob('/home/ubuntu/store/efficientnet-final-size/*h5')

In [124]:
model_names

['/home/ubuntu/store/efficientnet-final-size/efficientnetb4_4.h5',
 '/home/ubuntu/store/efficientnet-final-size/efficientnetb4_0.h5',
 '/home/ubuntu/store/efficientnet-final-size/efficientnetb4_2.h5',
 '/home/ubuntu/store/efficientnet-final-size/efficientnetb4_3.h5',
 '/home/ubuntu/store/efficientnet-final-size/efficientnetb4_1.h5']

In [125]:
model_name = Path(model_names[1]).stem

In [126]:
def get_table(results_pred):
    results_mean = results_pred.groupby('characteristic').median()
    results_std =  results_pred.groupby('characteristic').mad()
    
    ### Add means
    results_mean.loc['mean'] = results_mean.mean()
    results_std.loc['mean']   = results_mean.mean()
    
    columns = results_mean.columns.to_list()

    table_pred = results_mean
    return table_pred

class_map = {'0' : 'Acne' ,
             '1' : 'Actinic keratosis',
             '2' : 'Psoriasis' ,
             '3' : 'Seborrheic dermatitis',
             '4' : 'Viral warts',
             '5' : 'Vitiligo'}

filefolder = model_name + "_gradcam_scores.csv"
predsfile = '/home/ubuntu/store/efficientnet-final-size/' + model_name + '_preds.csv'

In [127]:
filtered_subjects = pd.read_csv('./include_images_525.csv')
filtered_subjects['image_id'] = filtered_subjects['image_id'].apply(lambda x: Path(x).stem)
filtered_subjects = filtered_subjects.rename(columns={'image_id': 'image_name'})
filtered_subjects = filtered_subjects.drop(columns=['Unnamed: 0'])

In [128]:
df_preds = pd.read_pickle(predsfile)
gradcam_df = pd.read_csv(filefolder)
gradcam_df=gradcam_df.drop(['Unnamed: 0'], axis=1)

In [129]:
df_preds['pred'] =  df_preds['pred'].apply(lambda x: class_map[str(x)])
df_preds['actual'] = df_preds['actual'].apply(lambda x: class_map[str(x)])
df_preds['filenames'] = df_preds['filenames'].apply(lambda x: Path(x).stem)
df_preds = df_preds.rename(columns={'filenames':'image_name'})
df_preds = df_preds.merge(filtered_subjects, on = 'image_name')

In [32]:
result = pd.merge(gradcam_df,df_preds, on = 'image_name')

results_pred = result[result.visualisation_class == result.pred]
table_pred = get_table(results_pred)
# Get it for actual
results_actual = result[result.visualisation_class == result.actual  ]
table_actual = get_table(results_actual)

table_pred.to_pickle('./' + model_name + '_gradcam_visualisation_scores_pred.pkl')
table_actual.to_pickle('./' + model_name + '_gradcam_visualisation_scores_actual.pkl')

results_equal = result[ (result.actual == result.pred) & (result.visualisation_class == result.pred) ]
table_equal = get_table(results_equal)

results_diff = result[ (result.actual != result.pred) & (result.visualisation_class == result.pred) ]
table_diff = get_table(results_diff)

table_equal.to_pickle('./' + model_name + '_gradcam_visualisation_scores_equal.pkl')
table_diff.to_pickle('./' + model_name + '_gradcam_visualisation_scores_diff.pkl')

# Creating Benchmarks

## By concatenation of all models

In [89]:
def lt_format(results_performance, col_n):
    results_mean = results_performance.groupby(col_n).mean()
    results_std = results_performance.groupby(col_n).std()
    
    results_mean.loc['mean'] = results_mean.mean()
    results_std.loc['mean'] = results_std.mean()
    for col in results_performance.columns.to_list():
        results_mean[col] = results_mean[col].apply(lambda x: f'{np.round(x,decimals=2)} $\pm$ ')
        results_std[col] = results_std[col].apply(lambda x: f'{np.round(x,decimals=2)}')
    
    return results_mean + results_std

model_names = glob.glob('/home/ubuntu/store/efficientnet-final-size/*h5')
results_actual = pd.DataFrame()
results_pred = pd.DataFrame()
results_equal = pd.DataFrame()
results_diff = pd.DataFrame()
results_performance = pd.DataFrame()

for mn in sorted(model_names):
    model_name = Path(mn).stem
    performance = pd.read_pickle('./' + model_name + '_performance.pkl')
    actual = pd.read_pickle('./' + model_name + '_gradcam_visualisation_scores_actual.pkl').loc[:,['recall','specificity','dice']]
    pred = pd.read_pickle('./' + model_name + '_gradcam_visualisation_scores_pred.pkl').loc[:,['recall','specificity','dice']]
    equal = pd.read_pickle('./' + model_name + '_gradcam_visualisation_scores_equal.pkl').loc[:,['recall','specificity','dice']]
    diff = pd.read_pickle('./' + model_name + '_gradcam_visualisation_scores_diff.pkl').loc[:,['recall','specificity','dice']]
    
    performance=performance.drop('mean')
    actual = actual.drop('mean')
    pred = pred.drop('mean')
    equal = equal.drop('mean')
    diff = diff.drop('mean')
    
    results_performance = pd.concat([results_performance, performance])
    results_actual = pd.concat([results_actual, actual])
    results_pred = pd.concat([results_pred, pred]) 
    results_diff = pd.concat([results_diff, diff])

results_performance.index.name = 'label'

table_performance = lt_format(results_performance, 'label')
table_actual = lt_format(results_actual, 'characteristic')

In [90]:
table_performance = table_performance.drop(columns = ['accuracy'])

In [91]:
table_performance

Unnamed: 0_level_0,precision,f1-score,specificity
label,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
acne,0.77 $\pm$ 0.16,0.65 $\pm$ 0.32,0.97 $\pm$ 0.02
actinic_keratosis,0.74 $\pm$ 0.08,0.55 $\pm$ 0.11,0.96 $\pm$ 0.02
psoriasis_no_pustular,0.43 $\pm$ 0.14,0.57 $\pm$ 0.12,0.67 $\pm$ 0.23
seborrheic_dermatitis,0.62 $\pm$ 0.08,0.45 $\pm$ 0.22,0.95 $\pm$ 0.03
vitiligo,0.0 $\pm$ 0.01,0.0 $\pm$ 0.01,0.9 $\pm$ 0.03
wart,0.08 $\pm$ 0.04,0.07 $\pm$ 0.04,0.86 $\pm$ 0.04
mean,0.44 $\pm$ 0.08,0.38 $\pm$ 0.14,0.89 $\pm$ 0.06


In [87]:
print(table_performance.to_latex())

\begin{tabular}{llll}
\toprule
{} &        precision &         f1-score &      specificity \\
label                 &                  &                  &                  \\
\midrule
acne                  &  0.77 \$\textbackslash pm\$ 0.16 &  0.65 \$\textbackslash pm\$ 0.32 &  0.97 \$\textbackslash pm\$ 0.02 \\
actinic\_keratosis     &  0.74 \$\textbackslash pm\$ 0.08 &  0.55 \$\textbackslash pm\$ 0.11 &  0.96 \$\textbackslash pm\$ 0.02 \\
psoriasis\_no\_pustular &  0.43 \$\textbackslash pm\$ 0.14 &  0.57 \$\textbackslash pm\$ 0.12 &  0.67 \$\textbackslash pm\$ 0.23 \\
seborrheic\_dermatitis &  0.62 \$\textbackslash pm\$ 0.08 &  0.45 \$\textbackslash pm\$ 0.22 &  0.95 \$\textbackslash pm\$ 0.03 \\
vitiligo              &   0.0 \$\textbackslash pm\$ 0.01 &   0.0 \$\textbackslash pm\$ 0.01 &   0.9 \$\textbackslash pm\$ 0.03 \\
wart                  &  0.08 \$\textbackslash pm\$ 0.04 &  0.07 \$\textbackslash pm\$ 0.04 &  0.86 \$\textbackslash pm\$ 0.04 \\
mean                  &  0.44 \

In [39]:
table_actual

Unnamed: 0_level_0,recall,specificity,dice
characteristic,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1
closed-comedo,0.21 $\pm$ 0.1,0.83 $\pm$ 0.04,0.08 $\pm$ 0.03
cyst,0.2 $\pm$ 0.14,0.85 $\pm$ 0.03,0.02 $\pm$ 0.01
dermatoglyph-disruption,0.09 $\pm$ 0.05,0.79 $\pm$ 0.06,0.05 $\pm$ 0.02
leukotrichia,0.14 $\pm$ 0.1,0.82 $\pm$ 0.04,0.07 $\pm$ 0.03
macule,0.27 $\pm$ 0.07,0.8 $\pm$ 0.03,0.09 $\pm$ 0.03
nodule,0.2 $\pm$ 0.08,0.82 $\pm$ 0.03,0.03 $\pm$ 0.01
open-comedo,0.19 $\pm$ 0.1,0.83 $\pm$ 0.04,0.08 $\pm$ 0.04
papule,0.23 $\pm$ 0.07,0.8 $\pm$ 0.03,0.07 $\pm$ 0.01
patch,0.28 $\pm$ 0.06,0.8 $\pm$ 0.03,0.21 $\pm$ 0.04
plaque,0.38 $\pm$ 0.03,0.81 $\pm$ 0.04,0.29 $\pm$ 0.01


In [40]:
print(table_actual[['dice','recall','specificity']].to_latex())

\begin{tabular}{llll}
\toprule
{} &             dice &           recall &      specificity \\
characteristic          &                  &                  &                  \\
\midrule
closed-comedo           &  0.08 \$\textbackslash pm\$ 0.03 &   0.21 \$\textbackslash pm\$ 0.1 &  0.83 \$\textbackslash pm\$ 0.04 \\
cyst                    &  0.02 \$\textbackslash pm\$ 0.01 &   0.2 \$\textbackslash pm\$ 0.14 &  0.85 \$\textbackslash pm\$ 0.03 \\
dermatoglyph-disruption &  0.05 \$\textbackslash pm\$ 0.02 &  0.09 \$\textbackslash pm\$ 0.05 &  0.79 \$\textbackslash pm\$ 0.06 \\
leukotrichia            &  0.07 \$\textbackslash pm\$ 0.03 &   0.14 \$\textbackslash pm\$ 0.1 &  0.82 \$\textbackslash pm\$ 0.04 \\
macule                  &  0.09 \$\textbackslash pm\$ 0.03 &  0.27 \$\textbackslash pm\$ 0.07 &   0.8 \$\textbackslash pm\$ 0.03 \\
nodule                  &  0.03 \$\textbackslash pm\$ 0.01 &   0.2 \$\textbackslash pm\$ 0.08 &  0.82 \$\textbackslash pm\$ 0.03 \\
open-comedo          