In [1]:
import time
import os
import copy
from collections import defaultdict

# deep learning/vision libraries
import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
from torchvision import datasets, models, transforms
import cv2 as cv  # OpenCV

# numeric and plotting libraries
import numpy as np
import matplotlib.pyplot as plt
from kard_data_loader import KardDataLoader
import consts as c

In [7]:
train = KardDataLoader('C:\\Users\\bozam\\Desktop\\KARD_all_in_one_folder')
train.getActivityData(c.FILETYPES['screen'])

In [8]:
def normalize(arr):
    return (arr - np.min(arr)) / (np.max(arr) - np.min(arr))

In [9]:
def make_training_set(data):
    generated_images = []
    generated_classes = []
    x = []
    y = []
    z = []
            
    for class_name in range(len(data)):
        image_sequence = []
        for people_sequences in range(len(data[class_name])):
            counter = 0
            for people_coordinates in data[class_name][people_sequences]:
                x.append(people_coordinates[0])
                y.append(people_coordinates[1])
                z.append(people_coordinates[2])
                counter += 1
                
                if counter == 15:
                    counter = 0
                    x = normalize(x)
                    
                    y = normalize(y)
                    
                    z = normalize(z)
                    
                    image_layer = [[x[i], y[i], z[i]] for i in range(15)]
                    generated_images.append(image_layer)
                    generated_classes.append(class_name)
                    x = []
                    y = []
                    z = []
            
    return generated_images, generated_classes

In [12]:
train_images, train_labels = make_training_set(train.data)

In [13]:
print(np.array(train_images).shape)
print(np.array(train_labels).shape)

(63630, 15, 3)
(63630,)


In [105]:
def make_baches(train_data, train_labels, batch_size, stride):
    batch_edges = [[a, a + batch_size] for a in range(0 , len(train_data) - batch_size, stride) if train_labels[a] == train_labels[a + batch_size]]
    
    batch_data = []
    batch_labels = []
    
    for (a, b) in (batch_edges):
        batch_data.append(train_data[a:b])
        batch_labels.append([train_labels[a] for _ in range(batch_size)])
    
    rnd_idx = np.random.permutation(len(batch_data))
    batch_data = np.array(batch_data)
    batch_labels = np.array(batch_labels)
    
    batch_data = batch_data[rnd_idx]
    batch_labels = batch_labels[rnd_idx]
    
    for i in range(len(batch_data)):
        yield (batch_data[i], batch_labels[i].reshape(-1, 1))
     

In [106]:
device = torch.device("cuda:0" if torch.cuda.is_available() else "cpu")

In [107]:
def count_parameters(model):
    return sum(p.numel() for p in model.parameters() if p.requires_grad)

In [114]:
def train_model(model, criterion, optimizer, num_epochs=100):
    start_time = time.time()

    best_model_wts = copy.deepcopy(model.state_dict())
    best_acc = 0.0
    
    metrics = defaultdict(list)

    for epoch in range(num_epochs):
        print(f'Epoch {epoch}/{num_epochs - 1}')
        print('-' * 10)

        # Each epoch has a training and validation phase
        for phase in ['train', 'val']:
            if phase == 'train':
                model.train()  # Set model to training mode
            else:
                model.eval()   # Set model to evaluate mode

            running_loss = 0.0
            running_corrects = 0

            # Iterate over data.
            for inputs, labels in make_baches(train_images, train_labels, 40, 3):
                inputs = torch.from_numpy(inputs)
                labels = torch.from_numpy(labels)
                inputs = inputs.to(device)
                labels = labels.to(device)

                # zero the parameter gradients
                optimizer.zero_grad()
                
                # forward
                # track history if only in train
                with torch.set_grad_enabled(phase == 'train'):
                    outputs = model(inputs.float())
                    
                    _, preds = torch.max(outputs, 1)
                    loss = criterion(outputs.float(), labels.long())

                    # backward + optimize only if in training phase
                    if phase == 'train':
                        loss.backward()
                        optimizer.step()

                # statistics
                running_loss += loss.item() * inputs.size(0)
                running_corrects += torch.sum(preds == labels.data).item()

            epoch_loss = running_loss / dataset_sizes[phase]
            epoch_acc = float(running_corrects) / dataset_sizes[phase]

            print(f'{phase} Loss: {epoch_loss:.4f} Acc: {epoch_acc:.4f}')
            
            metrics[phase+"_loss"].append(epoch_loss)
            metrics[phase+"_acc"].append(epoch_acc)

In [115]:
class CustomCNN(nn.Module):
    # [50, 100, 3, 3], but got 3-dimensional input of size [40, 15, 3]
    def __init__(self):
        super().__init__()
        num_of_channels = [15, 40, 2]
        kernel_sizes = [3, 1, 1]
        stride_sizes = [2, 2, 2]
        
        self.relu = torch.nn.ReLU()
        
        self.conv1 = nn.Conv1d(num_of_channels[0], num_of_channels[1], kernel_size=kernel_sizes[0])
        self.conv2 = nn.Conv1d(num_of_channels[1], num_of_channels[2], kernel_size=kernel_sizes[1])
        self.classifier = nn.Softmax(num_of_channels[-1])
        
    def forward(self, x):
        y = self.relu(self.conv1(x))
        y = self.relu(self.conv2(y))
        y = self.classifier(y)
        return y
    
custom_cnn = CustomCNN().to(device)
optimizer_conv = optim.Adam(filter(lambda p: p.requires_grad, custom_cnn.parameters()))

print(f"number of params in model {count_parameters(custom_cnn)}")

#
# todo: (#11) Why is acc 0.5? Anybody?
#
criterion = nn.CrossEntropyLoss()
model_conv, metrics = train_model(custom_cnn, criterion, optimizer_conv, num_epochs=25)

plt.subplots_adjust(wspace=1, hspace=1)
fig, ax = plt.subplots(nrows=2, ncols=2)
keys = list(metrics.keys())
cnt = 0
for row in ax:
    for col in row:
        col.set_title(keys[cnt])
        col.plot(metrics[keys[cnt]])
        cnt += 1

number of params in model 1922
Epoch 0/24
----------


IndexError: Target 6 is out of bounds.