In [1]:
import os

from pathlib import Path

import pandas as pd
import numpy as np
import torch
import torch.nn as nn

from PIL import Image
from torch.utils.data import Dataset, DataLoader
from torchvision import datasets, models, transforms

In [2]:
# All locations are plain strings built on top of ROOT_DIR (the parent of the
# current working directory).
ROOT_DIR = '../'
MODEL_PATH = f'{ROOT_DIR}models/Patryk-ResNeXt-more-layers-model.pkt'
TRAINING_LABELS_PATH = f'{ROOT_DIR}data/training_labels.csv'
TEST_DATA_PATH = f'{ROOT_DIR}data/live_test_images'
SUBMISSION_FILE = f'{ROOT_DIR}results/submission.csv'
OPTIMAL_THRESHOLD_PATH = f'{ROOT_DIR}models/optimal_thresholds.npy'

# Use CUDA when PyTorch reports it as available, otherwise fall back to the CPU.
if torch.cuda.is_available():
    DEVICE = torch.device('cuda')
else:
    DEVICE = torch.device('cpu')

print(DEVICE)

cpu


  return torch._C._cuda_getDeviceCount() > 0


In [3]:
class TestDataset(Dataset):
    """Unlabelled image dataset backed by the files of a single directory.

    Each item is the image at the corresponding position of ``self.images``,
    converted to RGB and passed through ``transform`` when one is given.

    Args:
        img_dir: Directory whose regular files are treated as images.
        transform: Optional callable applied to every loaded PIL image.
            Defaults to ``None`` (the RGB PIL image is returned unchanged).

    Attributes are set in ``__init__``:
        transform: The callable passed in (or ``None``).
        images: Sorted list of file paths (``img_dir`` joined with the file name).
    """

    def __init__(self, img_dir, transform=None):
        self.transform = transform
        # os.listdir() returns entries in arbitrary order and also lists
        # sub-directories (e.g. Jupyter's ``.ipynb_checkpoints``). Sort the names
        # so the item order is reproducible between runs, and keep regular files
        # only so Image.open() is never handed a directory.
        candidates = (os.path.join(img_dir, fname) for fname in sorted(os.listdir(img_dir)))
        self.images = [path for path in candidates if os.path.isfile(path)]

    def __getitem__(self, idx):
        """Return the image at position ``idx`` (transformed if a transform is set)."""
        # The context manager closes the underlying file once convert() has
        # produced the RGB copy, instead of leaving the handle to the garbage collector.
        with Image.open(self.images[idx]) as img:
            image = img.convert("RGB")

        if self.transform is not None:
            image = self.transform(image)
        return image

    def __len__(self):
        """Return the number of image files found in the directory."""
        return len(self.images)

In [4]:
# NOTE(review): torch.load unpickles the stored object, which can execute
# arbitrary code; only load checkpoints that come from a trusted source.
# This notebook only runs inference, so the loaded module is switched to
# evaluation mode right away (eval() returns the module itself); otherwise
# Dropout/BatchNorm layers keep whatever mode the checkpoint was saved in.
model = torch.load(MODEL_PATH, map_location=DEVICE).eval()

In [5]:
# Number of images per batch.
batch_size = 16

# Per-channel statistics handed to transforms.Normalize.
channel_mean = [0.485, 0.456, 0.406]
channel_std = [0.229, 0.224, 0.225]

# Preprocessing pipeline: resize -> centre crop -> tensor -> normalise.
preprocessing_steps = [
    transforms.Resize(256),
    transforms.CenterCrop(224),
    transforms.ToTensor(),
    transforms.Normalize(mean=channel_mean, std=channel_std),
]
transform = transforms.Compose(preprocessing_steps)

# shuffle=False keeps batches in the order of test_set.images, which the
# submission cell relies on when it pairs predictions with file names.
test_set = TestDataset(img_dir=TEST_DATA_PATH, transform=transform)
test_loader = DataLoader(dataset=test_set, batch_size=batch_size, shuffle=False)

In [6]:
# One array of sigmoid outputs per batch, in loader order.
results = []

# Make sure Dropout/BatchNorm layers behave deterministically for inference,
# whatever mode the model object is currently in (the call is idempotent).
model.eval()

# Gradients are never used here; disabling autograd avoids building a graph
# for every forward pass and keeps memory usage down.
with torch.no_grad():
    for batch in test_loader:
        logits = model(batch.to(DEVICE))
        # Sigmoid maps each output independently into (0, 1); cast to float32
        # and move to host memory before converting to NumPy.
        probs = torch.sigmoid(logits).to(torch.float32).cpu().numpy()
        results.append(probs)

In [7]:
# Read the saved threshold array; np.load opens and closes the .npy file
# itself when it is given a path.
optimal_thresholds = np.load(OPTIMAL_THRESHOLD_PATH)

In [8]:
# Display the loaded thresholds for inspection (the recorded output shows a
# 1-D array of 38 values; they are compared column-wise against the
# predictions in the submission cell).
optimal_thresholds

array([0.26666667, 0.45454545, 0.28571429, 0.43333333, 0.42105263,
       0.5       , 0.45762712, 0.38709677, 0.39622642, 0.30434783,
       0.33333333, 0.29861111, 0.35443038, 0.3968254 , 0.38541667,
       0.39130435, 0.38888889, 0.34848485, 0.36842105, 0.38461538,
       0.27160494, 0.34615385, 0.33333333, 0.09090909, 0.15789474,
       0.45971564, 0.34944238, 0.39393939, 0.36363636, 0.35658915,
       0.41463415, 0.5       , 0.41176471, 0.33333333, 0.13114754,
       0.44827586, 0.5       , 0.37944664])

In [9]:
# The training labels file is only used for its header: every column after
# the first one provides a column name for the predictions.
df = pd.read_csv(TRAINING_LABELS_PATH)
label_columns = df.columns[1:]

# Stack the per-batch outputs into one (n_images, n_outputs) array and take
# the file names in the same order the loader iterated over them.
probabilities = np.vstack(results)
image_names = [Path(el).name for el in test_loader.dataset.images]

# Fail early with a readable message if the pieces do not line up, instead of
# writing a silently misaligned submission.
assert probabilities.shape[0] == len(image_names), (
    f"{probabilities.shape[0]} prediction rows for {len(image_names)} images"
)
assert probabilities.shape[1] == len(label_columns) == len(optimal_thresholds), (
    f"model outputs ({probabilities.shape[1]}), label columns ({len(label_columns)}) "
    f"and thresholds ({len(optimal_thresholds)}) must have the same length"
)

# Threshold optimization: each column is binarised with its own threshold.
df_test = (pd.DataFrame(probabilities, columns=label_columns) > optimal_thresholds).astype(int)
names = pd.DataFrame({'Name': image_names})

submission = pd.concat([names, df_test], axis=1)

# Create the output directory if needed so to_csv does not fail on a fresh checkout.
os.makedirs(os.path.dirname(SUBMISSION_FILE) or '.', exist_ok=True)
submission.to_csv(SUBMISSION_FILE, index=False)