In [3]:
from tensorflow.keras.utils import to_categorical
from sklearn.preprocessing import LabelBinarizer, LabelEncoder
from imutils import paths
import numpy as np
import os
import cv2
import shutil
from glob import glob

In [4]:
# Collect every image file under the dataset directory. The paths are sorted
# so that the order of the resulting arrays does not depend on the order in
# which the filesystem happens to enumerate the files.
print("[INFO] loading training images...")
imagePaths = sorted(paths.list_images('covid19_dataset'))

# initialize the list of data (i.e., images) and class labels
data_train = []
labels_train = []

# loop over the image paths
for imagePath in imagePaths:
    # cv2.imread does not raise on a missing or undecodable file; it returns
    # None, which would make cv2.cvtColor fail below. Skip such files (and say
    # so) rather than aborting the whole load.
    image = cv2.imread(imagePath)
    if image is None:
        print("[WARN] skipping unreadable image: {}".format(imagePath))
        continue

    # the class label is the name of the directory that contains the image
    label = imagePath.split(os.path.sep)[-2]

    # swap color channels from OpenCV's BGR order to RGB, then resize to a
    # fixed 224x224 pixels
    image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
    image = cv2.resize(image, (224, 224))

    # append image and label together so the two lists stay index-aligned
    data_train.append(image)
    labels_train.append(label)

[INFO] loading training images...


In [5]:
# sanity check: display how many labels were collected by the loading loop
len(labels_train)

3000

In [6]:
# Convert the data and labels to NumPy arrays and scale the pixel
# intensities to the range [0, 1].
#
# The array is built as float32 on purpose: dividing an integer image array by
# 255.0 would otherwise promote it to float64, doubling both the memory needed
# here and the size of the .npy file written later.
#
# NOTE: this cell reassigns data_train from itself, so running it a second
# time without re-running the loading cell would divide by 255 again.
data_train = np.array(data_train, dtype="float32") / 255.0
labels_train = np.array(labels_train)

In [7]:
# One-hot encode the labels in a single pass: the fitted LabelEncoder turns
# each class name into an integer index, and to_categorical expands those
# indices into one-hot rows. `le` is kept so the encoder remains available
# after this cell.
le = LabelEncoder()
labels_train = to_categorical(le.fit_transform(labels_train))

In [8]:
# write the prepared images and their encoded labels to disk as two .npy files
np.save(file='new_3000_data_train_224.npy', arr=data_train)
np.save(file='new_3000_labels_train_224.npy', arr=labels_train)