In [1]:
import os
from pathlib import Path

import numpy as np
import pandas as pd
import pytorch_lightning as pl
import torch
import torchvision
from pytorch_lightning.metrics.functional.classification import accuracy
from skimage import io
from tqdm import tqdm

from src import DataModule, Resnet

In [2]:
# Build the project's data module from the local `data` directory and
# run its setup step so the dataloaders used below are available.
data_root = Path('data')
dm = DataModule(path=data_root, batch_size=64)
dm.setup()

Training samples:  17117
Validation samples:  4280


In [3]:
# Open the raw checkpoint only to inspect the hyper-parameters stored with it.
# map_location='cpu' keeps the saved tensors off the GPU: nothing here needs
# them on a device, and without it the load fails on a machine that lacks the
# device the checkpoint was saved from.
# NOTE: torch.load unpickles the file -- only open checkpoints you trust.
checkpoint = torch.load(
    './resnet18-256-val_acc=0.78398.ckpt',
    map_location='cpu',
)
hparams = checkpoint['hyper_parameters']
hparams

{'lr': 0.0003,
 'optimizer': 'Adam',
 'batch_size': 256,
 'max_epochs': 50,
 'precision': 16,
 'subset': 0.1,
 'test_size': 0.2,
 'seed': 42,
 'size': 256,
 'backbone': 'resnet18',
 'val_batches': 10,
 'extra_data': 1}

In [4]:
# Rebuild the Lightning module from the same checkpoint file and show the
# hyper-parameters it was restored with.
model = Resnet.load_from_checkpoint(
    checkpoint_path='./resnet18-256-val_acc=0.78398.ckpt',
)
model.hparams

"backbone":    resnet18
"batch_size":  256
"extra_data":  1
"lr":          0.0003
"max_epochs":  50
"optimizer":   Adam
"precision":   16
"seed":        42
"size":        256
"subset":      0.1
"test_size":   0.2
"val_batches": 10

In [5]:
 def evaluate(model, dl):   
    model.eval()
    model.cuda()
    acc = []
    with torch.no_grad():
        t = tqdm(dl)
        for x, y in t:
            x, y = x.cuda(), y.cuda()
            y_hat = model(x)
            acc.append(accuracy(y_hat, y).item())
            t.set_description(f"acc {np.mean(acc):.5f}")
            
# Baseline: score the restored model on the validation dataloader.
val_loader = dm.val_dataloader()
evaluate(model, val_loader)

acc 0.79734: 100%|██████████████████████████████████████████| 67/67 [00:44<00:00,  1.52it/s]


In [6]:
class Preprocess(torch.nn.Module):
    """Input stage of the exported model.

    Casts the batch to float, divides by 255 and moves the last axis to
    position 1 (axis order 0, 3, 1, 2).
    """

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        scaled = x.float() / 255.
        return scaled.permute(0, 3, 1, 2)
    
class Postprocess(torch.nn.Module):
    """Output stage of the exported model: index of the largest value along dim 1."""

    def forward(self, x: torch.Tensor) -> torch.Tensor:
        return x.argmax(dim=1)

In [7]:
# Bundle input scaling, the network and the argmax into one module so the
# saved artifact maps raw image batches straight to class ids.
export_net = torch.nn.Sequential(
    Preprocess(),
    model.resnet.cpu(),
    Postprocess(),
)
# Put the whole pipeline in inference mode explicitly: the train/eval flag is
# saved with the scripted module, and relying on an earlier cell having
# called model.eval() makes the export depend on execution order.
export_net.eval()

script = torch.jit.script(export_net)
torch.jit.save(script, "model.pt")

In [8]:
 def evaluate2(model, dl):   
    model.eval()
    model.cuda()
    acc = []
    with torch.no_grad():
        t = tqdm(dl)
        for x, y in t:
            x, y = x.cuda(), y.cuda()
            # simulate test
            x *= 255. 
            x = x.permute(0, 2, 3, 1).long()
            #print(x.shape, x.dtype, x.max(), x.min())
            y_hat = model(x)
            acc.append(accuracy(y_hat, y).item())
            t.set_description(f"acc {np.mean(acc):.5f}")

In [9]:
# Reload the exported TorchScript file and score it on the validation
# dataloader through the test-style input path.
loaded = torch.jit.load('model.pt')
val_loader = dm.val_dataloader()
evaluate2(loaded, val_loader)

acc 0.79714: 100%|██████████████████████████████████████████| 67/67 [00:43<00:00,  1.56it/s]


In [10]:
# Collect the file names in the test image directory.
# Uses pathlib (already imported) instead of os, and sorts the names so the
# order of predictions / submission rows is the same on every run.
path = Path('./data/test_images')
images = sorted(entry.name for entry in path.iterdir())
images_paths = [str(path/img) for img in images]
len(images)

1

In [11]:
def predict(model, images, bs=32, device=None):
    """Predict a class id for every image path in `images`.

    Images are read with `io.imread`, stacked into batches of at most `bs`
    and passed to `model`, whose output is cast to integer class ids.
    All images in a batch must have the same shape (np.stack raises
    otherwise).

    Args:
        model: a module called as `model(batch)` on the stacked image batch;
            its output is treated as one class id per image.
        images: sequence of image file paths.
        bs: maximum number of images per forward pass.
        device: device to run on. Defaults to CUDA when available, else CPU.

    Returns:
        1-D numpy int64 array with one prediction per input path, in input
        order (empty if `images` is empty).
    """
    if device is None:
        device = "cuda" if torch.cuda.is_available() else "cpu"
    device = torch.device(device)

    model.eval()
    model.to(device)

    preds = []
    with torch.no_grad():
        # Stepping by bs never produces an empty trailing batch, unlike
        # `len(images) // bs + 1` when the count is a multiple of bs.
        for start in tqdm(range(0, len(images), bs)):
            chunk = images[start:start + bs]
            imgs = torch.from_numpy(np.stack([io.imread(img) for img in chunk]))
            y_hat = model(imgs.to(device))
            preds.append(y_hat.long().cpu())

    if not preds:
        return np.empty(0, dtype=np.int64)
    return torch.cat(preds).numpy()

In [12]:
# Reload the exported model and predict a label for every test image path.
loaded = torch.jit.load('model.pt')
preds = predict(model=loaded, images=images_paths)
preds

100%|███████████████████████████████████████| 1/1 [00:00<00:00, 12.99it/s]

1





array([4], dtype=int64)

In [13]:
# Pair each test image file name with its predicted label.
submission = pd.DataFrame(dict(image_id=images, label=preds))
submission

Unnamed: 0,image_id,label
0,2216849948.jpg,4


In [14]:
# Write the submission table to disk without the index column.
submission.to_csv(path_or_buf='submission.csv', index=False)