__Note__: The code used here was heavily inspired by the AI for Medicine Specialization Course 1 Week three programming assignments: [link](https://www.coursera.org/learn/ai-for-medical-diagnosis)

In [1]:
import numpy as np
import nibabel as nib
import matplotlib.pyplot as plt
import json
import os
from pprint import pprint
from collections import OrderedDict
from ipywidgets import interact, interactive, IntSlider, ToggleButtons
from sys import getsizeof
from tqdm import tqdm

### Reading dataset description

In [2]:
file = open('../datasets_descriptions_json/task09_spleen_dataset.json')
data_description = json.load(file)

In [3]:
print(json.dumps(data_description, indent=4))

{
    "name": "Spleen",
    "description": "Spleen Segmentation",
    "reference": "Memorial Sloan Kettering Cancer Center",
    "licence": "CC-BY-SA 4.0",
    "release": "1.0 06/08/2018",
    "tensorImageSize": "3D",
    "modality": {
        "0": "CT"
    },
    "labels": {
        "0": "background",
        "1": "spleen"
    },
    "numTraining": 41,
    "numTest": 20,
    "training": [
        {
            "image": "./imagesTr/spleen_19.nii.gz",
            "label": "./labelsTr/spleen_19.nii.gz"
        },
        {
            "image": "./imagesTr/spleen_31.nii.gz",
            "label": "./labelsTr/spleen_31.nii.gz"
        },
        {
            "image": "./imagesTr/spleen_52.nii.gz",
            "label": "./labelsTr/spleen_52.nii.gz"
        },
        {
            "image": "./imagesTr/spleen_40.nii.gz",
            "label": "./labelsTr/spleen_40.nii.gz"
        },
        {
            "image": "./imagesTr/spleen_3.nii.gz",
            "label": "./labelsTr/spleen_3.nii.gz"


### Reading and visualizing spleen_2 nifti CT and mask files

#### CT file

In [4]:
ct_1 = nib.load("../../datasets/Task09_Spleen/train/images/spleen_2.nii.gz")

In [5]:
type(ct_1)

nibabel.nifti1.Nifti1Image

In [6]:
# Read Nifi Image object as numpy file
ct_1 = ct_1.get_fdata()

In [7]:
type(ct_1)

numpy.ndarray

In [8]:
ct_1.dtype

dtype('float64')

In [9]:
ct_1.shape

(512, 512, 90)

In [10]:
# Range of voxel values (maximum value - minimum value)
print(ct_1[:, :, :].ptp())

4095.0


In [11]:
getsizeof(ct_1) # 188.743808 MBs

188743808

In [12]:
getsizeof(ct_1.astype(np.float32)) # 94.371968 MBs

94371968

In [13]:
getsizeof(ct_1.astype(np.float16)) # 47.186048 MBs

47186048

#### Mask file

In [14]:
ct_1_mask = nib.load("../../datasets/Task09_Spleen/train/masks/spleen_2.nii.gz")

In [15]:
ct_1_mask = ct_1_mask.get_fdata()

In [16]:
ct_1_mask.dtype

dtype('float64')

In [17]:
getsizeof(ct_1_mask) # 188.743808 MBs

188743808

In [18]:
getsizeof(ct_1_mask.astype(np.float32)) # 94.371968 MBs

94371968

In [19]:
getsizeof(ct_1_mask.astype(np.uint8)) # 23.593088 MBs

23593088

In [20]:
ct_1_mask = ct_1_mask.astype(np.float32)

In [21]:
ct_1_mask.shape

(512, 512, 90)

### Visualizing nifti CT file and Mask file

In [22]:
# Create layer slider
select_layer = IntSlider(min=0, max=ct_1.shape[2] - 1, description='Select Layer', continuous_update=False)

    
# Define a function for plotting images
def plot(layer):
    print(f"Plotting Layer: {layer}")
    fig = plt.figure(figsize=(20, 10))
    
    fig.add_subplot(1, 2, 1)
    plt.imshow(ct_1[:, :, layer], cmap='gray');
    plt.title("ct", fontsize=20)
    plt.axis('off')
    
    fig.add_subplot(1, 2, 2)
    plt.title("Mask", fontsize=20)
    plt.imshow(ct_1_mask[:, :, layer], cmap='gray')
    plt.axis('off');

# Use the interactive() tool to create the visualization
interactive(plot, layer=select_layer)

interactive(children=(IntSlider(value=0, continuous_update=False, description='Select Layer', max=89), Output(…

### Reading and visualizing spleen_3 nifti CT and mask files

#### CT file

In [23]:
ct_2 = nib.load("../../datasets/Task09_Spleen/train/images/spleen_3.nii.gz")

In [24]:
type(ct_2)

nibabel.nifti1.Nifti1Image

In [25]:
# Read Nifi Image object as numpy file
ct_2 = ct_2.get_fdata()

In [26]:
type(ct_2)

numpy.ndarray

In [27]:
ct_2.dtype

dtype('float64')

In [28]:
ct_2.shape

(512, 512, 40)

In [29]:
# Range of voxel values (maximum value - minimum value)
print(ct_2[:, :, :].ptp())

2370.0


#### Mask file

In [30]:
ct_2_mask = nib.load("../../datasets/Task09_Spleen/train/masks/spleen_3.nii.gz")

In [31]:
ct_2_mask = ct_2_mask.get_fdata()

In [32]:
ct_2_mask.dtype

dtype('float64')

In [33]:
ct_2_mask = ct_2_mask.astype(np.float32)

In [34]:
ct_2_mask.shape

(512, 512, 40)

### Visualizing nifti CT file and Mask file

In [35]:
# Create layer slider
select_layer = IntSlider(min=0, max=ct_2.shape[2] - 1, description='Select Layer', continuous_update=False)

    
# Define a function for plotting images
def plot(layer):
    print(f"Plotting Layer: {layer}")
    fig = plt.figure(figsize=(20, 10))
    
    fig.add_subplot(1, 2, 1)
    plt.imshow(ct_2[:, :, layer], cmap='gray');
    plt.title("ct", fontsize=20)
    plt.axis('off')
    
    fig.add_subplot(1, 2, 2)
    plt.title("Mask", fontsize=20)
    plt.imshow(ct_2_mask[:, :, layer], cmap='gray')
    plt.axis('off');

# Use the interactive() tool to create the visualization
interactive(plot, layer=select_layer)

interactive(children=(IntSlider(value=0, continuous_update=False, description='Select Layer', max=39), Output(…

### Reading and visualizing spleen_6 nifti CT and mask files

#### CT file

In [36]:
ct_3 = nib.load("../../datasets/Task09_Spleen/train/images/spleen_6.nii.gz")

In [37]:
type(ct_3)

nibabel.nifti1.Nifti1Image

In [38]:
# Read Nifi Image object as numpy file
ct_3 = ct_3.get_fdata()

In [39]:
type(ct_3)

numpy.ndarray

In [40]:
ct_3.dtype

dtype('float64')

In [41]:
ct_3.shape

(512, 512, 135)

In [42]:
# Range of voxel values (maximum value - minimum value)
print(ct_3[:, :, :].ptp())

2276.0


#### Mask file

In [43]:
ct_3_mask = nib.load("../../datasets/Task09_Spleen/train/masks/spleen_6.nii.gz")

In [44]:
ct_3_mask = ct_3_mask.get_fdata()

In [45]:
ct_3_mask.dtype

dtype('float64')

In [46]:
ct_3_mask = ct_3_mask.astype(np.float32)

In [47]:
ct_3_mask.shape

(512, 512, 135)

### Visualizing nifti CT file and Mask file

In [48]:
# Create layer slider
select_layer = IntSlider(min=0, max=ct_3.shape[2] - 1, description='Select Layer', continuous_update=False)

    
# Define a function for plotting images
def plot(layer):
    print(f"Plotting Layer: {layer}")
    fig = plt.figure(figsize=(20, 10))
    
    fig.add_subplot(1, 2, 1)
    plt.imshow(ct_3[:, :, layer], cmap='gray');
    plt.title("ct", fontsize=20)
    plt.axis('off')
    
    fig.add_subplot(1, 2, 2)
    plt.title("Mask", fontsize=20)
    plt.imshow(ct_3_mask[:, :, layer], cmap='gray')
    plt.axis('off');

# Use the interactive() tool to create the visualization
interactive(plot, layer=select_layer)

interactive(children=(IntSlider(value=0, continuous_update=False, description='Select Layer', max=134), Output…

### Calculating CT shape counter dictionary

In [49]:
data_dir = "../../datasets/Task09_Spleen/"

train_mri_paths = [os.path.join(data_dir + "train/images", x) for x in os.listdir(data_dir + "train/images")]
val_mri_paths = [os.path.join(data_dir + "val/images", x) for x in os.listdir(data_dir + "val/images")]
test_mri_paths = [os.path.join(data_dir + "test_images_for_model_prediction_submission", x) for x in os.listdir(data_dir + "test_images_for_model_prediction_submission")]

all_paths = train_mri_paths + val_mri_paths + test_mri_paths  # concatenate list of paths

shape_count_dict = {}

for path in tqdm(all_paths):
    mri = nib.load(path).get_fdata()
    shape = mri.shape
    
    if shape not in shape_count_dict.keys():
        shape_count_dict[shape] = 1
    else:
        shape_count_dict[shape] += 1   

100%|██████████| 61/61 [00:23<00:00,  2.56it/s]


In [50]:
shape_count_dict = OrderedDict(sorted(shape_count_dict.items(), key=lambda item: item[1], reverse=True))
pprint(shape_count_dict)

OrderedDict([((512, 512, 94), 3),
             ((512, 512, 44), 2),
             ((512, 512, 112), 2),
             ((512, 512, 61), 2),
             ((512, 512, 103), 2),
             ((512, 512, 168), 2),
             ((512, 512, 89), 2),
             ((512, 512, 50), 2),
             ((512, 512, 98), 2),
             ((512, 512, 48), 2),
             ((512, 512, 96), 2),
             ((512, 512, 54), 1),
             ((512, 512, 104), 1),
             ((512, 512, 41), 1),
             ((512, 512, 164), 1),
             ((512, 512, 95), 1),
             ((512, 512, 55), 1),
             ((512, 512, 100), 1),
             ((512, 512, 83), 1),
             ((512, 512, 40), 1),
             ((512, 512, 51), 1),
             ((512, 512, 77), 1),
             ((512, 512, 87), 1),
             ((512, 512, 90), 1),
             ((512, 512, 148), 1),
             ((512, 512, 135), 1),
             ((512, 512, 65), 1),
             ((512, 512, 93), 1),
             ((512, 512, 119), 1),
     

In [51]:
list_layers = []
for key, val in shape_count_dict.items():
    list_layers.append(key[2])

layers = np.array(list_layers)
print(layers.mean())
print(np.median(layers))
print(layers.min())
print(layers.max())

86.12244897959184
89.0
31
168
