# Data loading pipeline examples

The purpose of this notebook is to illustrate reading NIfTI files and to compare the speed of different loading and preprocessing methods.

[![Open In Colab](https://colab.research.google.com/assets/colab-badge.svg)](https://colab.research.google.com/github/Project-MONAI/tutorials/blob/master/acceleration/transform_speed.ipynb)

## Setup environment

In [1]:
# Install the MONAI weekly build (with the nibabel extra) only when `import monai` fails.
!python -c "import monai" || pip install -q "monai-weekly[nibabel]"

## Setup imports

In [2]:
# Copyright 2020 MONAI Consortium
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#     http://www.apache.org/licenses/LICENSE-2.0
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

import glob
import os
import shutil
import tempfile

import nibabel as nib
import numpy as np
import torch

# Ask torch.multiprocessing to start worker processes with "spawn".
# A RuntimeError is deliberately ignored here -- presumably it is raised when
# the start method has already been set (e.g. when this cell is re-run).
try:
    torch.multiprocessing.set_start_method("spawn")
except RuntimeError:
    pass


from monai.config import print_config
from monai.data import ArrayDataset, create_test_image_3d
from monai.transforms import (
    AddChannel,
    Compose,
    LoadImage,
    RandAffine,
    RandSpatialCrop,
    Rotate,
    ScaleIntensity,
    EnsureType,
)
from monai.utils import first

# Print the versions of MONAI and its dependencies for reproducibility.
print_config()

MONAI version: 0.4.0+35.g6adbcde
Numpy version: 1.19.5
Pytorch version: 1.7.1
MONAI flags: HAS_EXT = False, USE_COMPILED = False
MONAI rev id: 6adbcdee45c16f18f5b713575af3410437177311

Optional dependencies:
Pytorch Ignite version: 0.4.2
Nibabel version: 3.2.1
scikit-image version: 0.18.1
Pillow version: 7.0.0
Tensorboard version: 2.2.0
gdown version: 3.12.2
TorchVision version: 0.8.2
ITK version: 5.1.2
tqdm version: 4.51.0
lmdb version: 1.0.0
psutil version: 5.8.0

For details about installing the optional dependencies, please visit:
    https://docs.monai.io/en/latest/installation.html#installing-the-recommended-dependencies



## Setup data directory

You can specify a directory with the `MONAI_DATA_DIRECTORY` environment variable.  
This allows you to save results and reuse downloads.  
If not specified, a temporary directory will be used.

In [3]:
# Resolve where the test data lives.
# - `directory` is the user-provided location (None when MONAI_DATA_DIRECTORY
#   is unset OR empty); the cleanup cell relies on `directory is None` to know
#   that a temporary directory was created.
# - `root_dir` is the directory actually used by the rest of the notebook.
# An empty environment variable is normalized to None; otherwise `root_dir`
# would end up as "" and files would be written to the current working
# directory without ever being cleaned up.
directory = os.environ.get("MONAI_DATA_DIRECTORY") or None
if directory is not None:
    directory = os.path.join(directory, "transform_speed")
    os.makedirs(directory, exist_ok=True)
    root_dir = directory
else:
    root_dir = tempfile.mkdtemp()
print(root_dir)

/workspace/data/medical


### 0. Preparing input data (nifti images)

Create five test NIfTI image/segmentation pairs: 3D single-channel volumes with a spatial size of (256, 256, 256) voxels.

In [4]:
# Generate five synthetic image/segmentation volumes and store each one as a
# gzip-compressed NIfTI file (identity affine) inside `root_dir`.
for i in range(5):
    im, seg = create_test_image_3d(256, 256, 256)

    image_path = os.path.join(root_dir, f"im{i}.nii.gz")
    seg_path = os.path.join(root_dir, f"seg{i}.nii.gz")

    nib.save(nib.Nifti1Image(im, np.eye(4)), image_path)
    nib.save(nib.Nifti1Image(seg, np.eye(4)), seg_path)

In [5]:
# Collect the image and segmentation file names; both lists are sorted.
image_pattern = os.path.join(root_dir, "im*.nii.gz")
seg_pattern = os.path.join(root_dir, "seg*.nii.gz")

images = sorted(glob.glob(image_pattern))
segs = sorted(glob.glob(seg_pattern))

### 1. Test image loading with minimal preprocessing

In [6]:
# Image and segmentation use the same minimal chain (load -> add channel ->
# ensure type), each with its own independent transform instances.
imtrans, segtrans = (
    Compose([LoadImage(image_only=True), AddChannel(), EnsureType()])
    for _ in range(2)
)

ds = ArrayDataset(img=images, img_transform=imtrans, seg=segs, seg_transform=segtrans)
loader = torch.utils.data.DataLoader(dataset=ds, batch_size=3, num_workers=8)

# Fetch the first batch and report its shapes.
im, seg = first(loader)
print(im.shape, seg.shape)

torch.Size([3, 1, 256, 256, 256]) torch.Size([3, 1, 256, 256, 256])


In [7]:
# Time fetching one batch; `iter(loader)` builds a new iterator, so whatever
# setup that involves is included in the measurement.
%time data = next(iter(loader))

CPU times: user 23.3 ms, sys: 133 ms, total: 156 ms
Wall time: 8.6 s


### 2. Test image-patch loading with CPU multi-processing:

- rotate each (256, 256, 256)-voxel volume in the plane axes=(1, 2)
- extract random (64, 64, 64) patches
- implemented in MONAI using `scipy.ndimage.rotate`

In [8]:
# Re-list the files so this cell can be run on its own after data creation.
images = sorted(glob.glob(os.path.join(root_dir, "im*.nii.gz")))
segs = sorted(glob.glob(os.path.join(root_dir, "seg*.nii.gz")))

# Image pipeline: load, rescale intensities, add a channel dimension,
# rotate by pi/4 and crop a fixed-size (64, 64, 64) random patch.
imtrans = Compose(
    [
        LoadImage(image_only=True),
        ScaleIntensity(),
        AddChannel(),
        Rotate(angle=np.pi / 4),
        RandSpatialCrop((64, 64, 64), random_size=False),
        EnsureType(),
    ]
)

# Segmentation pipeline: same geometry as the image, but resampled with
# nearest-neighbour interpolation so that label values are not blended
# (consistent with the "nearest" mode used for the segmentation in section 3).
segtrans = Compose(
    [
        LoadImage(image_only=True),
        AddChannel(),
        Rotate(angle=np.pi / 4, mode="nearest"),
        RandSpatialCrop((64, 64, 64), random_size=False),
        EnsureType(),
    ]
)

ds = ArrayDataset(images, imtrans, segs, segtrans)
# Preprocessing runs in 8 worker processes; pinned memory is requested only
# when CUDA is available.
loader = torch.utils.data.DataLoader(
    ds, batch_size=3, num_workers=8, pin_memory=torch.cuda.is_available()
)

im, seg = first(loader)
print(im.shape, seg.shape)

torch.Size([3, 1, 64, 64, 64]) torch.Size([3, 1, 64, 64, 64])


In [9]:
# Time one batch of the multi-process CPU pipeline, measured from a freshly
# created iterator over `loader`.
%time data = next(iter(loader))

CPU times: user 20.4 ms, sys: 1.07 s, total: 1.09 s
Wall time: 22.6 s


(the above results were based on Intel(R) Xeon(R) CPU E5-2650 v4 @ 2.20GHz)

### 3. Test image-patch loading with preprocessing on GPU:

- randomly rotate each (256, 256, 256)-voxel volume in the plane axes=(1, 2)
- extract random (64, 64, 64) patches
- implemented in MONAI using native pytorch resampling

In [10]:
# Re-list the files so this cell can be run on its own after data creation.
images = sorted(glob.glob(os.path.join(root_dir, "im*.nii.gz")))
segs = sorted(glob.glob(os.path.join(root_dir, "seg*.nii.gz")))

# Resample on the first CUDA device when one is available. Falling back to
# the CPU keeps the notebook runnable on machines without a GPU (the timing
# below then no longer reflects GPU preprocessing).
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")
if device.type != "cuda":
    print("CUDA is not available: RandAffine resampling will run on the CPU.")

# same parameter with different interpolation mode for image and segmentation
affine_kwargs = dict(
    prob=1.0,
    rotate_range=np.pi / 4,
    translate_range=(96, 96, 96),
    spatial_size=(64, 64, 64),
    as_tensor_output=True,
    device=device,
)
rand_affine_img = RandAffine(mode="bilinear", **affine_kwargs)
rand_affine_seg = RandAffine(mode="nearest", **affine_kwargs)

imtrans = Compose(
    [LoadImage(image_only=True), ScaleIntensity(),
     AddChannel(), rand_affine_img, EnsureType()]
)

segtrans = Compose([LoadImage(image_only=True),
                    AddChannel(), rand_affine_seg, EnsureType()])

ds = ArrayDataset(images, imtrans, segs, segtrans)
# num_workers=0: the transforms run in the main process.
loader = torch.utils.data.DataLoader(ds, batch_size=3, num_workers=0)

im, seg = first(loader)

print(im.shape, seg.shape)

torch.Size([3, 1, 64, 64, 64]) torch.Size([3, 1, 64, 64, 64])


In [11]:
# Time one batch of the RandAffine-based pipeline, measured from a freshly
# created iterator over `loader`.
%time data = next(iter(loader))

CPU times: user 3.25 s, sys: 1.06 s, total: 4.31 s
Wall time: 4.31 s


In [12]:
# Report the GPU model and PyTorch's CUDA memory statistics for device 0.
# Both calls are only made when CUDA is available, so the notebook still runs
# to completion on CPU-only machines.
if torch.cuda.is_available():
    print(torch.cuda.get_device_name(0))
    print(torch.cuda.memory_summary(0, abbreviated=True))
else:
    print("CUDA is not available; no GPU device or memory statistics to report.")

Tesla V100-SXM3-32GB
|                  PyTorch CUDA memory summary, device ID 0                 |
|---------------------------------------------------------------------------|
|            CUDA OOMs: 0            |        cudaMalloc retries: 0         |
|        Metric         | Cur Usage  | Peak Usage | Tot Alloc  | Tot Freed  |
|---------------------------------------------------------------------------|
| Allocated memory      |   12288 KB |   88064 KB |    1188 MB |    1176 MB |
|---------------------------------------------------------------------------|
| Active memory         |   12288 KB |   88064 KB |    1188 MB |    1176 MB |
|---------------------------------------------------------------------------|
| GPU reserved memory   |  159744 KB |  159744 KB |  159744 KB |       0 B  |
|---------------------------------------------------------------------------|
| Non-releasable memory |    8192 KB |   77823 KB |     833 MB |     825 MB |
|------------------------------------------

## Cleanup data directory

Remove the directory if a temporary one was used.

In [13]:
# `directory` is None only when no MONAI_DATA_DIRECTORY was used and
# `root_dir` came from tempfile.mkdtemp(); a user-provided directory is kept.
created_temp_dir = directory is None
if created_temp_dir:
    shutil.rmtree(root_dir)