# CPTAC-PDA image conversion

> Convert `.svs` image files to Zarr arrays, optionally downscaled by an integer factor

***

In [None]:
# Install zarr and load packages
!pip install -qq zarr
import tifffile, cv2, zarr
from pathlib import Path
import matplotlib.pyplot as plt
from tqdm.notebook import tqdm

In [None]:
# Configuration shared by the cells below
scale = 2  # integer factor both image axes are divided by (1 = keep size)
path = Path('../input/cptacpda')  # directory scanned for input files
# Keep only the directory entries whose suffix is exactly '.svs'.
files = list(filter(lambda entry: entry.suffix == '.svs', path.iterdir()))
# Output zarr group; its name records the scale factor in use.
g_data = zarr.group(store=f'images_scale{scale}')

In [None]:
# Loop over files: read each image, optionally downscale it, store it in the
# zarr group under the file's stem, and plot a small preview.
for f in tqdm(files):
    print(f.name)
    img = tifffile.imread(f)

    if scale != 1:
        # cv2.resize expects the target size as (width, height), i.e. the
        # reverse of the (rows, cols) order used by img.shape.
        new_size = (img.shape[1] // scale, img.shape[0] // scale)
        # Report both shapes in (height, width) order so they are comparable.
        print(f'Resizing from {img.shape[:2]} to {new_size[::-1]}')
        # INTER_AREA resamples using pixel-area relation and avoids the
        # aliasing that the default bilinear mode produces when shrinking.
        img = cv2.resize(img, new_size, interpolation=cv2.INTER_AREA)

    g_data[f.stem] = img
    print(g_data[f.stem].info)

    print('Plotting')
    fig, ax = plt.subplots(figsize=(15, 15))
    shape = img.shape
    # Preview is 1024 px wide with the aspect ratio preserved; the height is
    # clamped to at least 1 px so an extremely wide image cannot produce an
    # empty target size (which cv2.resize rejects).
    preview_size = (1024, max(1, 1024 * shape[0] // shape[1]))
    ax.imshow(cv2.resize(img, preview_size))
    plt.show()