# Inport needed package

- import os, sys # to add the parent directory to the path

In [2]:
import os
import sys
import time

- Using torchvision to create a dataset

In [3]:
# Using torchvision to create a dataset
import cv2
from torchvision import transforms
import torch
from torch.utils.data import random_split, DataLoader
import torchvision

import pandas as pd

- import self library

In [4]:
from train.trainer import ClassifierTrainer as Trainer
import dataset as ds  # type: ignore
import model as md  # type: ignore

# Define classification train process

1. Define place where the model is saved

In [12]:
time_str = time.strftime("%Y%m%d_%H%M%S")


2. Define train function

In [13]:
def doTheTrain(dataset, model):
  # define batch_size
  batch_size = 64

  # init train val test ds
  train_val_size = int(0.8 * len(dataset))
  test_size = len(dataset) - train_val_size
  train_ds, test_ds = random_split(dataset, [train_val_size, test_size])

  # define optimizer using Adam and loss function
  optimizer = torch.optim.Adam(model.parameters(), lr=0.001)
  loss_fn = torch.nn.CrossEntropyLoss()

  trainer = Trainer(model, optimizer, loss_fn, random_seed_value=86)
  print('device: ', trainer.device)
  avg_loss, metric = trainer.cross_validate(train_ds, k=5, epochs=10, batch_size=batch_size)
  print('avg_loss: ', avg_loss)

  # score model
  test_dataloader = DataLoader(test_ds, batch_size=batch_size, shuffle=True)
  model_scored = trainer.score(test_dataloader)
  print(f'model_scored: {model_scored:.4f}, avg_accuracy: {100*(1 - model_scored):.4f}')

  # return model scored, train_avg_lost
  return model_scored, avg_loss

3. execute progress

- define the model

In [None]:
models = [
	torchvision.models.resnet50(weights=torchvision.models.ResNet50_Weights.DEFAULT),
  torchvision.models.densenet121(weights=torchvision.models.DenseNet121_Weights.DEFAULT),
  torchvision.models.vgg16(weights=torchvision.models.VGG16_Weights.DEFAULT)
]



- Define tested datasets

In [15]:
datasets = {
    'gi4e_full': ds.Gi4eDataset(
        './datasets/gi4e',
        transform=transforms.Compose([transforms.ToPILImage(), transforms.Resize((224, 224)), transforms.ToTensor()]),
        is_classification=True),
    'gi4e_raw_eyes': ds.ImageDataset(
        './datasets/gi4e_raw_eyes',
        transform=transforms.Compose([transforms.Resize((224, 224)), transforms.ToTensor()]),
        file_extension='png'),
    'gi4e_detected_eyes': ds.ImageDataset(
        './datasets/gi4e_eyes/20250521_200316',
        transform=transforms.Compose([transforms.Resize((224, 224)), transforms.ToTensor()]),
        file_extension='png'),
}

- Train all defined model on each registered datasets

In [16]:
result_df = pd.DataFrame(columns=['dataset', 'model', 'avg_loss', 'avg_accuracy', 'total_time'])

for name, dataset in datasets.items():
	for model in models:
		print(f'Running {name} dataset with {model.__class__.__name__}')
		# do the train
		start_time = time.time()
		scored, loss = doTheTrain(dataset, model)
		end_time = time.time()
		total_time = end_time - start_time
		print(f'Finished {name} dataset with {model.__class__.__name__}')
		print('----------------------')

		# save the result
		result_df = pd.concat([result_df, pd.DataFrame({
			'model': [model.__class__.__name__],
			'dataset': [name],
			'avg_loss': [loss],
			'avg_accuracy': [scored],
			'total_time': [total_time]
		})], ignore_index=True)

print('Finished all datasets')

# print the result
print(result_df)



Running gi4e_full dataset with Classifier


RuntimeError: CUDA error: device-side assert triggered
CUDA kernel errors might be asynchronously reported at some other API call, so the stacktrace below might be incorrect.
For debugging consider passing CUDA_LAUNCH_BLOCKING=1
Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.


4. print the result

In [None]:
# swap the first two columns
result_df = result_df[['dataset', 'model', 'avg_loss', 'avg_accuracy', 'total_time']]
# scale the avg_accuracy to 0-100
result_df['avg_accuracy'] = 100 * (1 - result_df['avg_accuracy'])
# display the total time in the format HH:MM:SS
result_df['total_time'] = pd.to_timedelta(result_df['total_time'], unit='s')

# save the result to csv
result_df.to_csv(f'results_{time_str}.csv', index=False)
# print the result
print(result_df)

              dataset     model  avg_loss  avg_accuracy  \
0           gi4e_full    ResNet  0.000011     99.981028   
1           gi4e_full  DenseNet  0.000229     99.993595   
2           gi4e_full       VGG  0.059837     99.096932   
3       gi4e_raw_eyes    ResNet  0.004592     94.986418   
4       gi4e_raw_eyes  DenseNet  0.005347     95.743190   
5       gi4e_raw_eyes       VGG  0.119210     78.677075   
6  gi4e_detected_eyes    ResNet  0.122154     94.245342   
7  gi4e_detected_eyes  DenseNet  0.003370     97.697311   
8  gi4e_detected_eyes       VGG  0.031279     93.412539   

                 total_time  
0 0 days 00:26:04.910116911  
1 0 days 00:15:41.770978928  
2 0 days 00:19:16.193440437  
3 0 days 00:12:16.112033606  
4 0 days 00:10:20.350670099  
5 0 days 00:15:50.633701324  
6 0 days 00:09:34.279892683  
7 0 days 00:10:33.354367256  
8 0 days 00:16:07.067535877  


In [None]:
print(result_df)

              dataset     model  avg_loss  avg_accuracy  \
0           gi4e_full    ResNet  0.000011     99.981028   
1           gi4e_full  DenseNet  0.000229     99.993595   
2           gi4e_full       VGG  0.059837     99.096932   
3       gi4e_raw_eyes    ResNet  0.004592     94.986418   
4       gi4e_raw_eyes  DenseNet  0.005347     95.743190   
5       gi4e_raw_eyes       VGG  0.119210     78.677075   
6  gi4e_detected_eyes    ResNet  0.122154     94.245342   
7  gi4e_detected_eyes  DenseNet  0.003370     97.697311   
8  gi4e_detected_eyes       VGG  0.031279     93.412539   

                 total_time  
0 0 days 00:26:04.910116911  
1 0 days 00:15:41.770978928  
2 0 days 00:19:16.193440437  
3 0 days 00:12:16.112033606  
4 0 days 00:10:20.350670099  
5 0 days 00:15:50.633701324  
6 0 days 00:09:34.279892683  
7 0 days 00:10:33.354367256  
8 0 days 00:16:07.067535877  


# Embedded Classification

- Define the model

In [None]:
embedded_models = [md.FeatureExtractor(model) for model in models]
classifier_models_temp = [md.Classifier(model) for model in models]




- Load the trained weight to the model

In [None]:
# ignore

- Transform the dataset to the embedded data

In [None]:
classifier_df = pd.DataFrame(columns=['key', 'dataset', 'model'])

for name, dataset in datasets.items():
  for model in embedded_models:
    print(f'Getting features for {name} dataset with {model.__class__.__name__}')

    # get the classifier model from the model
    classifier_model = next((m for m in classifier_models_temp if m.__class__.__name__ ==
                            model.__class__.__name__.replace('FeatureExtractor', 'Classifier')), None)
    if classifier_model is None:
      print(f'Classifier model not found for {model.__class__.__name__}')
      continue

    model_dataset = ds.EmbeddedDataset(dataset, model)

    classifier_df = pd.concat([classifier_df, pd.DataFrame({
        'key': [f'{name}_{model.__class__.__name__}'],
        'model': [classifier_model],
        'dataset': [model_dataset]
    })], ignore_index=True)

    print(f'Finished getting features for {name} dataset with {model.__class__.__name__}')

- Train all defined model on each registered datasets

In [None]:
result_df = pd.DataFrame(columns=['dataset', 'model', 'avg_loss', 'avg_accuracy', 'total_time'])

for index, row in classifier_df.iterrows():
  dataset = row['dataset']
  model = row['model']
  key = row['key']

  print(f'Running {key} dataset with {model.__class__.__name__}')
  # do the train
  start_time = time.time()
  scored, loss = doTheTrain(dataset, model)
  end_time = time.time()
  total_time = end_time - start_time
  print(f'Finished {key} dataset with {model.__class__.__name__}')
  print('----------------------')

  # save the result
  result_df = pd.concat([result_df, pd.DataFrame({
      'model': [model.__class__.__name__],
      'dataset': [dataset.__class__.__name__],
      'avg_loss': [loss],
      'avg_accuracy': [scored],
      'total_time': [total_time]
  })], ignore_index=True)

Running gi4e_full dataset with Classifier


RuntimeError: CUDA error: device-side assert triggered
CUDA kernel errors might be asynchronously reported at some other API call, so the stacktrace below might be incorrect.
For debugging consider passing CUDA_LAUNCH_BLOCKING=1
Compile with `TORCH_USE_CUDA_DSA` to enable device-side assertions.


- Print the result

In [None]:
# swap the first two columns
result_df = result_df[['dataset', 'model', 'avg_loss', 'avg_accuracy', 'total_time']]
# scale the avg_accuracy to 0-100
result_df['avg_accuracy'] = 100 * (1 - result_df['avg_accuracy'])
# display the total time in the format HH:MM:SS
result_df['total_time'] = pd.to_timedelta(result_df['total_time'], unit='s')

# save the result to csv
result_df.to_csv(f'results_{time_str}.csv', index=False)
# print the result
print(result_df)

In [8]:
models = [
	torchvision.models.resnet50(weights=torchvision.models.ResNet50_Weights.DEFAULT),
  torchvision.models.densenet121(weights=torchvision.models.DenseNet121_Weights.DEFAULT),
  torchvision.models.vgg16(weights=torchvision.models.VGG16_Weights.DEFAULT)
]

for model in models:
  # explore the model
	print(f'Model: {model.__class__.__name__}')
	
	# explain the model
	print(f'Number of layers: {len(list(model.children()))}')
	print(model)

Model: ResNet
Number of layers: 10
ResNet(
  (conv1): Conv2d(3, 64, kernel_size=(7, 7), stride=(2, 2), padding=(3, 3), bias=False)
  (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
  (relu): ReLU(inplace=True)
  (maxpool): MaxPool2d(kernel_size=3, stride=2, padding=1, dilation=1, ceil_mode=False)
  (layer1): Sequential(
    (0): Bottleneck(
      (conv1): Conv2d(64, 64, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (bn1): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (conv2): Conv2d(64, 64, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1), bias=False)
      (bn2): BatchNorm2d(64, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (conv3): Conv2d(64, 256, kernel_size=(1, 1), stride=(1, 1), bias=False)
      (bn3): BatchNorm2d(256, eps=1e-05, momentum=0.1, affine=True, track_running_stats=True)
      (relu): ReLU(inplace=True)
      (downsample): Sequential(
        (0): Conv2d(64, 2