# Randomly sampling the data, reducing it from 27563 photos to 1000 photos split between the uninfected (malaria-free) and parasitized classes. Each class should have 500 photos.

### Uninfected (malaria-free) photos - Randomize

In [10]:
import os
import shutil
import random

# Randomly move up to 500 uninfected cell images from the raw dataset folder
# into the "clean" output folder.

# Input folder with all images. os.path.join picks the right separator for the
# current OS; on Windows the result is the same string as before.
input_folder = os.path.join("Dataset", "cell_images", "Uninfected")

# Output folder to store the randomly selected images. Built with os.path.join
# because the previous literal relied on "\c" and "\o", which are invalid
# escape sequences that newer Python versions warn about.
output_folder = os.path.join("Dataset", "clean", "output_uninfected")

# Create the output folder if it doesn't exist
os.makedirs(output_folder, exist_ok=True)

# Number of images to select (500 in this case)
num_images_to_select = 500

# Only these extensions count as images. The processing step further down
# skips everything else, so moving a non-image entry (a stray metadata file or
# a sub-folder) would silently leave this class with fewer than 500 photos.
image_extensions = (".jpg", ".jpeg", ".png", ".gif")

# List the image files in the input folder
files = [
    name for name in os.listdir(input_folder) if name.endswith(image_extensions)
]

# Images already sitting in the output folder count toward the target, so
# re-running this cell does not move a further 500 images out of the dataset.
already_selected = sum(
    name.endswith(image_extensions) for name in os.listdir(output_folder)
)
num_to_move = max(0, num_images_to_select - already_selected)

# Shuffle the list of files randomly
random.shuffle(files)

# Move the first `num_to_move` shuffled files; slicing copes with a folder
# that holds fewer images than requested.
for file_name in files[:num_to_move]:
    shutil.move(
        os.path.join(input_folder, file_name),
        os.path.join(output_folder, file_name),
    )

print("Random selection complete.")


Random selection complete.


### Parasitized with Malaria photos - Randomize

In [11]:
# Randomly move up to 500 parasitized cell images from the raw dataset folder
# into the "clean" output folder.

# Input folder with all images. os.path.join picks the right separator for the
# current OS; on Windows the result is the same string as before.
input_folder = os.path.join("Dataset", "cell_images", "Parasitized")

# Output folder to store the randomly selected images. Built with os.path.join
# because the previous literal relied on "\c" and "\o", which are invalid
# escape sequences that newer Python versions warn about.
output_folder = os.path.join("Dataset", "clean", "output_parasitized")

# Create the output folder if it doesn't exist
os.makedirs(output_folder, exist_ok=True)

# Number of images to select (500 in this case)
num_images_to_select = 500

# Only these extensions count as images. The processing step further down
# skips everything else, so moving a non-image entry (a stray metadata file or
# a sub-folder) would silently leave this class with fewer than 500 photos.
image_extensions = (".jpg", ".jpeg", ".png", ".gif")

# List the image files in the input folder
files = [
    name for name in os.listdir(input_folder) if name.endswith(image_extensions)
]

# Images already sitting in the output folder count toward the target, so
# re-running this cell does not move a further 500 images out of the dataset.
already_selected = sum(
    name.endswith(image_extensions) for name in os.listdir(output_folder)
)
num_to_move = max(0, num_images_to_select - already_selected)

# Shuffle the list of files randomly
random.shuffle(files)

# Move the first `num_to_move` shuffled files; slicing copes with a folder
# that holds fewer images than requested.
for file_name in files[:num_to_move]:
    shutil.move(
        os.path.join(input_folder, file_name),
        os.path.join(output_folder, file_name),
    )

print("Random selection complete.")

Random selection complete.


# Preprocessing the images: resizing them from 150x150 to 25x25 and converting them from RGB to grayscale (black and white)

### Uninfected (malaria-free) photos - Processed

In [13]:
from PIL import Image

# Resize every selected uninfected image to 25x25 pixels, convert it to
# grayscale, and save it under the same filename in the processed folder.

# Input and output folder paths. Built with os.path.join because the previous
# literals relied on "\c" and "\o", which are invalid escape sequences that
# newer Python versions warn about; on Windows the resulting strings are
# unchanged.
input_folder = os.path.join("Dataset", "clean", "output_uninfected")
output_folder = os.path.join("Dataset", "clean", "output_uninfected_process")

# Create the output folder if it doesn't exist
os.makedirs(output_folder, exist_ok=True)

# List all files in the input folder
files = os.listdir(input_folder)

# Target size and accepted extensions do not change per file, so they are
# defined once outside the loop.
new_size = (25, 25)
image_extensions = (".jpg", ".jpeg", ".png", ".gif")

# Loop through each file in the input folder
for file in files:
    # Skip anything that is not an image; the comparison is case-insensitive
    # so files such as "cell.PNG" are processed too.
    if not file.lower().endswith(image_extensions):
        continue

    image_path = os.path.join(input_folder, file)

    # Open the image in a context manager so its file handle is released as
    # soon as this image is done instead of staying open for the whole run.
    with Image.open(image_path) as image:
        # Resize the image to 25x25 pixels
        resized_image = image.resize(new_size)

        # Convert the image to 8-bit grayscale (Pillow mode "L")
        bw_image = resized_image.convert("L")

        # Save the resulting image in the output folder with the same filename
        output_path = os.path.join(output_folder, file)
        bw_image.save(output_path)

print("Conversion complete.")


Conversion complete.


### Parasitized with Malaria photos - Processed

In [14]:
# Resize every selected parasitized image to 25x25 pixels, convert it to
# grayscale, and save it under the same filename in the processed folder.

# Input and output folder paths. Built with os.path.join because the previous
# literals relied on "\c" and "\o", which are invalid escape sequences that
# newer Python versions warn about; on Windows the resulting strings are
# unchanged.
input_folder = os.path.join("Dataset", "clean", "output_parasitized")
output_folder = os.path.join("Dataset", "clean", "output_parasitized_process")

# Create the output folder if it doesn't exist
os.makedirs(output_folder, exist_ok=True)

# List all files in the input folder
files = os.listdir(input_folder)

# Target size and accepted extensions do not change per file, so they are
# defined once outside the loop.
new_size = (25, 25)
image_extensions = (".jpg", ".jpeg", ".png", ".gif")

# Loop through each file in the input folder
for file in files:
    # Skip anything that is not an image; the comparison is case-insensitive
    # so files such as "cell.PNG" are processed too.
    if not file.lower().endswith(image_extensions):
        continue

    image_path = os.path.join(input_folder, file)

    # Open the image in a context manager so its file handle is released as
    # soon as this image is done instead of staying open for the whole run.
    with Image.open(image_path) as image:
        # Resize the image to 25x25 pixels
        resized_image = image.resize(new_size)

        # Convert the image to 8-bit grayscale (Pillow mode "L")
        bw_image = resized_image.convert("L")

        # Save the resulting image in the output folder with the same filename
        output_path = os.path.join(output_folder, file)
        bw_image.save(output_path)

print("Conversion complete.")

Conversion complete.
