/
prepare_mini_imagenet.py
57 lines (46 loc) · 1.88 KB
/
prepare_mini_imagenet.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
"""
Run this script to prepare the miniImageNet dataset.
This script uses the 100 classes of 600 images each used in the Matching Networks paper. The exact images used are
given in data/mini_imagenet.txt which is downloaded from the link provided in the paper (https://goo.gl/e3orz6).
1. Download files from https://drive.google.com/file/d/0B3Irx3uQNoBMQ1FlNXJsZUdYWEE/view and place in
data/miniImageNet/images
2. Run the script
"""
from tqdm import tqdm as tqdm
import numpy as np
import shutil
import os
from config import DATA_PATH
from few_shot.utils import mkdir, rmdir
# Clean up folders
rmdir(DATA_PATH + '/miniImageNet/images_background')
rmdir(DATA_PATH + '/miniImageNet/images_evaluation')
mkdir(DATA_PATH + '/miniImageNet/images_background')
mkdir(DATA_PATH + '/miniImageNet/images_evaluation')
# Find class identities
classes = []
for root, _, files in os.walk(DATA_PATH + '/miniImageNet/images/'):
for f in files:
if f.endswith('.jpg'):
classes.append(f[:-12])
classes = list(set(classes))
# Train/test split
np.random.seed(0)
np.random.shuffle(classes)
background_classes, evaluation_classes = classes[:80], classes[80:]
# Create class folders
for c in background_classes:
mkdir(DATA_PATH + f'/miniImageNet/images_background/{c}/')
for c in evaluation_classes:
mkdir(DATA_PATH + f'/miniImageNet/images_evaluation/{c}/')
# Move images to correct location
for root, _, files in os.walk(DATA_PATH + '/miniImageNet/images'):
for f in tqdm(files, total=600*100):
if f.endswith('.jpg'):
class_name = f[:-12]
image_name = f[-12:]
# Send to correct folder
subset_folder = 'images_evaluation' if class_name in evaluation_classes else 'images_background'
src = f'{root}/{f}'
dst = DATA_PATH + f'/miniImageNet/{subset_folder}/{class_name}/{image_name}'
shutil.copy(src, dst)