In [None]:
# Mount Google Drive at /content/drive (Colab only); the dataset paths used
# below all live under this mount point.
from google.colab import drive
drive.mount('/content/drive')

Mounted at /content/drive


In [None]:

import os
import pickle
import cv2
from tqdm import tqdm
from pathlib import Path
import imageio as iio
import imgaug.augmenters as ia
import imgaug
import numpy as np
from PIL import Image, ImageOps

In [None]:
data_dir = '/content/drive/MyDrive/TRECVID/Dataset'

# Every sub-directory of data_dir is treated as one class. Plain files that
# happen to sit next to the class folders are ignored, because each class
# name is later used as a folder to create and to iterate over.
class_names = sorted(
    entry for entry in os.listdir(data_dir)
    if os.path.isdir(os.path.join(data_dir, entry))
)
print("Class Names:", class_names)
print("Number of classes: ", len(class_names))

Class Names: ['calloused_hands_baseball_field', 'calloused_hands_car', 'calloused_hands_diner', 'calloused_hands_josh_s_house', 'calloused_hands_rabbi_s_house', 'calloused_hands_school', 'calloused_hands_synagogue', 'chained_for_life_garden', 'chained_for_life_hospital', 'chained_for_life_hotel', 'liberty_kid_carnival', 'liberty_kid_house1', 'liberty_kid_house2', 'liberty_kid_prison', 'liberty_kid_statue_of_liberty', 'like_me_diner', 'like_me_gas_station', 'like_me_motel', 'little_rock_caravan', 'little_rock_fun_place', 'little_rock_gallery', 'little_rock_house1', 'little_rock_house2', 'little_rock_motel', 'little_rock_shop', 'losing_ground_home1', 'losing_ground_home2', 'losing_ground_neighbourhood', 'losing_ground_rental_house', 'losing_ground_rooftop', 'losing_ground_university-workplace']
Number of classes:  31


In [None]:
# Folder the original images are read from, one sub-folder per class
# (same path as data_dir).
source = '/content/drive/MyDrive/TRECVID/Dataset'
# Folder the augmented images are written to, one sub-folder per class.
target = '/content/drive/MyDrive/TRECVID/datadir'

In [None]:
# Class folder names, each prefixed with '/', as consumed by sequence().
# NOTE(review): this name shadows the built-in `iter`; it is kept because
# sequence() reads it under this name.
iter = [f'/{name}' for name in class_names]
print(iter)

['/calloused_hands_baseball_field', '/calloused_hands_car', '/calloused_hands_diner', '/calloused_hands_josh_s_house', '/calloused_hands_rabbi_s_house', '/calloused_hands_school', '/calloused_hands_synagogue', '/chained_for_life_garden', '/chained_for_life_hospital', '/chained_for_life_hotel', '/liberty_kid_carnival', '/liberty_kid_house1', '/liberty_kid_house2', '/liberty_kid_prison', '/liberty_kid_statue_of_liberty', '/like_me_diner', '/like_me_gas_station', '/like_me_motel', '/little_rock_caravan', '/little_rock_fun_place', '/little_rock_gallery', '/little_rock_house1', '/little_rock_house2', '/little_rock_motel', '/little_rock_shop', '/losing_ground_home1', '/losing_ground_home2', '/losing_ground_neighbourhood', '/losing_ground_rental_house', '/losing_ground_rooftop', '/losing_ground_university-workplace']


In [None]:
# Create one output folder per class under `target`.
for class_name in class_names:
  class_dir = os.path.join(target, class_name)
  try:
    # makedirs also creates `target` itself when it does not exist yet.
    os.makedirs(class_dir)
  except FileExistsError:
    # Folder is left over from an earlier run; nothing to do.
    continue
  print(f'Make dir {class_name} successful!')

## Sequence transform

### Augmentation

In [None]:
def sometimes(aug):
    """Wrap `aug` in ia.Sometimes with probability 0.5."""
    return ia.Sometimes(0.5, aug)

# Augmentation pipeline applied to every image. It has two top-level steps,
# an optional affine transform and a SomeOf group of pixel-level augmenters,
# and the two steps are executed in random order.
seq = ia.Sequential(
    [
        #
        # Geometric augmenters. Flips and crops are currently disabled.
        #
        #ia.Fliplr(0.5), # horizontally flip 50% of all images
        #ia.Flipud(0.2), # vertically flip 20% of all images

        # crop some of the images by 0-10% of their height/width
        #sometimes(ia.Crop(percent=(0, 0.1))),

        # Apply affine transformations to some of the images
        # - translate by -20 to +20 percent of height/width (per axis)
        # - shear by -16 to +16 degrees
        # - order: use nearest neighbour or bilinear interpolation (fast)
        # - mode: use any available mode to fill newly created pixels
        #         see API or scikit-image for which modes are available
        # - cval: if the mode is constant, then use a random brightness
        #         for the newly created pixels (e.g. sometimes black,
        #         sometimes white)
        # Scaling (80-120% per axis) and rotation (-45 to +45 degrees) are
        # currently disabled; see the commented-out arguments below.
        sometimes(ia.Affine(
            #scale={"x": (0.8, 1.2), "y": (0.8, 1.2)},
            translate_percent={"x": (-0.2, 0.2), "y": (-0.2, 0.2)},
            #rotate=(-45, 45),
            shear=(-16, 16),
            order=[0, 1],
            cval=(0, 255),
            mode=imgaug.ALL
        )),

        #
        # Execute 0 to 5 of the following (less important) augmenters per
        # image. Don't execute all of them, as that would often be way too
        # strong.
        #
        ia.SomeOf((0, 5),
            [
                # Convert some images into their superpixel representation,
                # sample between 20 and 200 superpixels per image, but do
                # not replace all superpixels with their average, only
                # some of them (p_replace).
                sometimes(
                    ia.Superpixels(
                        p_replace=(0, 1.0),
                        n_segments=(20, 200)
                    )
                ),

                # Blur each image with varying strength using one of:
                # gaussian blur (sigma between 0 and 3.0),
                # average/uniform blur (kernel size between 2x2 and 7x7),
                # median blur (kernel size between 3x3 and 11x11).
                ia.OneOf([
                    ia.GaussianBlur((0, 3.0)),
                    ia.AverageBlur(k=(2, 7)),
                    ia.MedianBlur(k=(3, 11)),
                ]),

                # Sharpen each image, overlay the result with the original
                # image using an alpha between 0 (no sharpening) and 1
                # (full sharpening effect).
                ia.Sharpen(alpha=(0, 1.0), lightness=(0.75, 1.5)),

                # Same as sharpen, but for an embossing effect.
                ia.Emboss(alpha=(0, 1.0), strength=(0, 2.0)),

                # Search in some images either for all edges or for
                # directed edges. These edges are then marked in a black
                # and white image and overlaid with the original image
                # using an alpha of 0 to 0.7.
                sometimes(ia.OneOf([
                    ia.EdgeDetect(alpha=(0, 0.7)),
                    ia.DirectedEdgeDetect(
                        alpha=(0, 0.7), direction=(0.0, 1.0)
                    ),
                ])),

                # Add gaussian noise to some images.
                # In 50% of these cases, the noise is randomly sampled per
                # channel and pixel.
                # In the other 50% of all cases it is sampled once per
                # pixel (i.e. brightness change).
                ia.AdditiveGaussianNoise(
                    loc=0, scale=(0.0, 0.05*255), per_channel=0.5
                ),

                # Either drop randomly 1 to 10% of all pixels (i.e. set
                # them to black) or drop 3 to 15% of the pixels of a coarse
                # mask that has 2-5% of the original size, leading to large
                # dropped rectangles.
                ia.OneOf([
                    ia.Dropout((0.01, 0.1), per_channel=0.5),
                    ia.CoarseDropout(
                        (0.03, 0.15), size_percent=(0.02, 0.05),
                        per_channel=0.2
                    ),
                ]),

                # Disabled: invert each image's channel with 5% probability.
                # This sets each pixel value v to 255-v.
                #ia.Invert(0.05, per_channel=True), # invert color channels

                # Disabled: add a value of -10 to 10 to each pixel.
                #ia.Add((-10, 10), per_channel=0.5),

                # Change brightness of images (50-150% of original value).
                ia.Multiply((0.5, 1.5), per_channel=0.5),

                # Improve or worsen the contrast of images.
                ia.LinearContrast((0.5, 2.0), per_channel=0.5),

                # Disabled: convert each image to grayscale and then overlay
                # the result with the original with random alpha. I.e. remove
                # colors with varying strengths.
                #ia.Grayscale(alpha=(0.0, 1.0)),

                # In some images move pixels locally around (with random
                # strengths).
                sometimes(
                    ia.ElasticTransformation(alpha=(0.5, 3.5), sigma=0.25)
                ),

                # Disabled: in some images distort local areas with varying
                # strength.
                # sometimes(ia.PiecewiseAffine(scale=(0.01, 0.05)))
            ],
            # apply the augmenters selected by SomeOf in random order
            random_order=True
        )
    ],
    # apply the two top-level steps in random order
    random_order=True)
def sequence():
    """Write augmented variants of every source image into `target`.

    For each class folder listed in `iter`, every file found under `source`
    is read and augmented 500 times with `seq`. Each variant is saved as
    ``<n>_v<k>.JPG`` in the matching `target` folder, where ``n`` is the
    1-based position of the file in the sorted directory listing and ``k``
    is the variant index. The unmodified image is saved as ``<n>.JPG``.

    NOTE: a later cell defines `sequence` again; a call resolves to whichever
    definition was executed most recently.
    """
    def drop_alpha(image):
        # JPEG cannot store an alpha channel, so keep only the first three
        # channels of 4-channel images; other shapes pass through unchanged.
        if image.ndim == 3 and image.shape[2] == 4:
            return image[..., :3]
        return image

    for i in iter:
        out_dir = target + '/' + i
        # Sort the listing so the numbering of output files is stable.
        for count, file in enumerate(sorted(Path(source + "/" + i).iterdir()), start=1):
            img = iio.imread(file)
            for k in range(500):
                imgnew = drop_alpha(seq.augment_image(img))
                iio.imwrite(out_dir + '/' + str(count) + "_v" + str(k) + '.JPG', imgnew)
            iio.imwrite(out_dir + '/' + str(count) + '.JPG', drop_alpha(img))

In [None]:
def sequence():
    """Write 500 augmented variants of every source image into `target`.

    For each class folder listed in `iter`, every file found under `source`
    is read and augmented 500 times with `seq`. Each variant is saved as
    ``<n>_v<k>.JPG`` in the matching `target` folder, where ``n`` is the
    1-based position of the file in the sorted directory listing and ``k``
    is the variant index. The unmodified source image is not written.

    A class whose output folder already contains at least one entry is
    skipped entirely.
    NOTE(review): a class that was interrupted part-way is therefore left
    incomplete on the next run; empty its folder to regenerate it.
    """
    for i in iter:
        out_dir = target + "/" + i
        if os.listdir(out_dir):
            continue
        # Sort the listing so the numbering of output files is stable.
        for count, file in enumerate(sorted(Path(source + "/" + i).iterdir()), start=1):
            img = iio.imread(file)
            for k in tqdm(range(500)):
                imgnew = seq.augment_image(img)
                # JPEG cannot store an alpha channel. COLOR_RGBA2RGB only
                # accepts 4-channel input, so convert only when alpha is
                # actually present and leave other images as they are.
                if imgnew.ndim == 3 and imgnew.shape[2] == 4:
                    imgnew = cv2.cvtColor(imgnew, cv2.COLOR_RGBA2RGB)
                iio.imwrite(out_dir + '/' + str(count) + "_v" + str(k) + '.JPG', imgnew)

In [None]:
# Run the augmentation pass. This calls whichever `sequence` definition was
# executed most recently.
sequence()

  img = iio.imread(file)
100%|██████████| 500/500 [00:07<00:00, 66.50it/s]
100%|██████████| 500/500 [00:08<00:00, 59.29it/s]
100%|██████████| 500/500 [00:07<00:00, 64.35it/s]
100%|██████████| 500/500 [00:07<00:00, 62.58it/s]
100%|██████████| 500/500 [00:08<00:00, 56.79it/s]
100%|██████████| 500/500 [00:07<00:00, 65.10it/s]
100%|██████████| 500/500 [00:08<00:00, 58.89it/s]
100%|██████████| 500/500 [00:07<00:00, 66.27it/s]
100%|██████████| 500/500 [00:08<00:00, 60.10it/s]
100%|██████████| 500/500 [00:07<00:00, 65.23it/s]
100%|██████████| 500/500 [00:08<00:00, 59.29it/s]
100%|██████████| 500/500 [00:31<00:00, 15.75it/s]
100%|██████████| 500/500 [00:21<00:00, 22.82it/s]
100%|██████████| 500/500 [00:21<00:00, 22.73it/s]
100%|██████████| 500/500 [00:28<00:00, 17.71it/s]
100%|██████████| 500/500 [00:23<00:00, 21.49it/s]
100%|██████████| 500/500 [00:40<00:00, 12.41it/s]
100%|██████████| 500/500 [00:22<00:00, 22.54it/s]
100%|██████████| 500/500 [00:23<00:00, 21.12it/s]
100%|██████████| 500/500 

In [None]:
import torch
import torch.nn as nn
import torch.optim as optim
from torch.optim import lr_scheduler
import numpy as np
import torchvision
from torchvision import datasets, models, transforms
from torch.utils.data import random_split
import matplotlib.pyplot as plt
import time
import os
import copy

In [None]:
import random
import shutil

train_dir = '/content/datadir/train'
valid_dir = '/content/datadir/valid'

# Create output folders if they don't exist
os.makedirs(train_dir, exist_ok=True)
os.makedirs(valid_dir, exist_ok=True)

# NOTE(review): the split below is per file. If `target` holds the
# `<n>_v<k>.JPG` variants written by sequence(), variants of the same source
# image end up in both train and valid, which makes validation scores
# optimistic. Consider splitting by source image instead.

# Iterate through each class folder in the input folder
for class_folder in sorted(os.listdir(target)):
    class_path = os.path.join(target, class_folder)

    # Skip non-directory entries
    if not os.path.isdir(class_path):
        continue

    # os.listdir returns entries in arbitrary order, so sort first; without
    # this the fixed seed below would not reproduce the same split.
    files = sorted(os.listdir(class_path))

    # Shuffle the files with a fixed seed for reproducibility
    random.seed(0)
    random.shuffle(files)

    # 80% of the files go to training, the rest to validation
    split_index = int(len(files) * 0.8)
    train_files = files[:split_index]
    valid_files = files[split_index:]

    # Copy (not move) the files into the corresponding output folders
    for split_dir, split_files in ((train_dir, train_files), (valid_dir, valid_files)):
        if not split_files:
            # Do not create an empty class folder for an empty split.
            continue
        dest_dir = os.path.join(split_dir, class_folder)
        os.makedirs(dest_dir, exist_ok=True)
        for file in split_files:
            src_path = os.path.join(class_path, file)
            dest_path = os.path.join(dest_dir, file)
            shutil.copy(src_path, dest_path)