In [1]:
!pip install compressai

Collecting compressai
  Downloading compressai-1.2.0-cp37-cp37m-manylinux_2_17_x86_64.manylinux2014_x86_64.whl (295 kB)
[?25l[K     |█                               | 10 kB 30.6 MB/s eta 0:00:01[K     |██▏                             | 20 kB 37.8 MB/s eta 0:00:01[K     |███▎                            | 30 kB 42.5 MB/s eta 0:00:01[K     |████▍                           | 40 kB 45.9 MB/s eta 0:00:01[K     |█████▌                          | 51 kB 20.6 MB/s eta 0:00:01[K     |██████▋                         | 61 kB 23.4 MB/s eta 0:00:01[K     |███████▊                        | 71 kB 24.6 MB/s eta 0:00:01[K     |████████▉                       | 81 kB 26.3 MB/s eta 0:00:01[K     |██████████                      | 92 kB 28.3 MB/s eta 0:00:01[K     |███████████                     | 102 kB 30.2 MB/s eta 0:00:01[K     |████████████▏                   | 112 kB 30.2 MB/s eta 0:00:01[K     |█████████████▎                  | 122 kB 30.2 MB/s eta 0:00:01[K     |█████████

In [2]:
import argparse
import math
import random
import shutil
import sys
import time
import numpy as np

import torch
import torch.nn as nn
import torch.optim as optim

from torch.utils.data import DataLoader
from torchvision import transforms
import torchvision

from compressai.datasets import ImageFolder
from compressai.zoo import image_models
import compressai

In [3]:
from compressai.zoo import (bmshj2018_factorized, bmshj2018_hyperprior, mbt2018_mean, mbt2018, cheng2020_anchor)
device = 'cuda' if torch.cuda.is_available() else 'cpu'
metric = 'mse'  # only pre-trained model for mse are available for now
quality = 1     # lower quality -> lower bit-rate (use lower quality to clearly see visual differences in the notebook)
networks = {
    'bmshj2018-factorized': bmshj2018_factorized(quality=quality, pretrained=True).eval().to(device),
    'bmshj2018-hyperprior': bmshj2018_hyperprior(quality=quality, pretrained=True).eval().to(device),
    'mbt2018-mean': mbt2018_mean(quality=quality, pretrained=True).eval().to(device),
    'mbt2018': mbt2018(quality=quality, pretrained=True).eval().to(device),
    'cheng2020-anchor': cheng2020_anchor(quality=quality, pretrained=True).eval().to(device),
}

net = networks['bmshj2018-hyperprior']

Downloading: "https://compressai.s3.amazonaws.com/models/v1/bmshj2018-factorized-prior-1-446d5c7f.pth.tar" to /root/.cache/torch/hub/checkpoints/bmshj2018-factorized-prior-1-446d5c7f.pth.tar


  0%|          | 0.00/11.5M [00:00<?, ?B/s]

Downloading: "https://compressai.s3.amazonaws.com/models/v1/bmshj2018-hyperprior-1-7eb97409.pth.tar" to /root/.cache/torch/hub/checkpoints/bmshj2018-hyperprior-1-7eb97409.pth.tar


  0%|          | 0.00/20.2M [00:00<?, ?B/s]

Downloading: "https://compressai.s3.amazonaws.com/models/v1/mbt2018-mean-1-e522738d.pth.tar" to /root/.cache/torch/hub/checkpoints/mbt2018-mean-1-e522738d.pth.tar


  0%|          | 0.00/27.6M [00:00<?, ?B/s]

Downloading: "https://compressai.s3.amazonaws.com/models/v1/mbt2018-1-3f36cd77.pth.tar" to /root/.cache/torch/hub/checkpoints/mbt2018-1-3f36cd77.pth.tar


  0%|          | 0.00/61.8M [00:00<?, ?B/s]

Downloading: "https://compressai.s3.amazonaws.com/models/v1/cheng2020-anchor-1-dad2ebff.pth.tar" to /root/.cache/torch/hub/checkpoints/cheng2020-anchor-1-dad2ebff.pth.tar


  0%|          | 0.00/49.1M [00:00<?, ?B/s]

In [4]:
net.aux_loss()

tensor(275.8194, device='cuda:0', grad_fn=<AddBackward0>)

In [5]:
from google.colab import drive
drive.mount('MyDrive')

Mounted at MyDrive


In [6]:
import os 
os.chdir(r'/content/MyDrive/MyDrive/DL_Project_HP')

### Model Classes

In [7]:
class RateDistortionLoss(nn.Module):
    """Custom rate distortion loss with a Lagrangian parameter."""

    def __init__(self, lmbda=1e-2):
        super().__init__()
        self.crossEntropy = nn.CrossEntropyLoss()
        self.lmbda = lmbda

    def forward(self, output, target, preds, labels):
        N, _, H, W = target.size()
        out = {}
        num_pixels = N * H * W

        out["bpp_loss"] = sum(
            (torch.log(likelihoods).sum() / (-math.log(2) * num_pixels))
            for likelihoods in output["likelihoods"].values()
        )
        out['log_loss'] = self.crossEntropy(preds, labels)
        out["loss"] = self.lmbda * out["log_loss"] + out["bpp_loss"]

        return out


class AverageMeter:
    """Compute running average."""

    def __init__(self):
        self.val = 0
        self.avg = 0
        self.sum = 0
        self.count = 0

    def update(self, val, n=1):
        self.val = val
        self.sum += val * n
        self.count += n
        self.avg = self.sum / self.count


class CustomDataParallel(nn.DataParallel):
    """Custom DataParallel to access the module methods."""

    def __getattr__(self, key):
        try:
            return super().__getattr__(key)
        except AttributeError:
            return getattr(self.module, key)


def configure_optimizers(net, args):
    """Separate parameters for the main optimizer and the auxiliary optimizer.
    Return two optimizers"""

    parameters = {
        n
        for n, p in net.named_parameters()
        if not n.endswith(".quantiles") and p.requires_grad
    }
    aux_parameters = {
        n
        for n, p in net.named_parameters()
        if n.endswith(".quantiles") and p.requires_grad
    }

    # Make sure we don't have an intersection of parameters
    params_dict = dict(net.named_parameters())
    inter_params = parameters & aux_parameters
    union_params = parameters | aux_parameters

    assert len(inter_params) == 0
    assert len(union_params) - len(params_dict.keys()) == 0

    optimizer = optim.Adam(
        (params_dict[n] for n in sorted(parameters)),
        lr=args.learning_rate
    )
    aux_optimizer = optim.Adam(
        (params_dict[n] for n in sorted(aux_parameters)),
        lr=args.aux_learning_rate,
    )
    return optimizer, aux_optimizer

### Train and Test Epochs

In [8]:
def train_one_epoch(
    model, criterion, train_dataloader, optimizer, aux_optimizer, epoch, clip_max_norm
):
    model.train()
    device = next(model.parameters()).device
    train_acc = 0

    for i, d in enumerate(train_dataloader):
        images = d[0].to(device)
        labels = d[1].to(device)
        images = images.cuda()
        labels = labels.cuda()

        optimizer.zero_grad()
        aux_optimizer.zero_grad()

        if clip_max_norm > 0:
            torch.nn.utils.clip_grad_norm_(model.parameters(), clip_max_norm)

        out_net = model(images)
        preds = out_net['y_hat']
        pred_labels = out_net['y_hat'].argmax(dim=1)
        train_acc += torch.sum(labels == pred_labels).item()
        out_criterion = criterion(out_net, images, preds, labels)
        out_criterion["loss"].backward()



        optimizer.step()

        aux_loss = model.aux_loss()
        aux_loss.backward()
        aux_optimizer.step()

        if i % 100 == 0:
            print(
                f"Train epoch {epoch}: ["
                f"{i*len(images)}/{len(train_dataloader.dataset)}"
                f" ({100. * i / len(train_dataloader):.0f}%)]"

                f'\tLoss: {out_criterion["loss"].item():.4f} |'
                f'\tBpp loss: {out_criterion["bpp_loss"].item():.4f} |'
                f'\tLog loss: {out_criterion["log_loss"].item():.4f} |'
                f"\tAux loss: {aux_loss.item():.4f}"
            )
    train_acc = train_acc/500
    print(f'\nTrain epoch {epoch}: \tAcc: {train_acc:.4f} |')


def test_epoch(epoch, test_dataloader, model, criterion):
    model.eval()
    device = next(model.parameters()).device

    loss = AverageMeter()
    bpp_loss = AverageMeter()
    mse_loss = AverageMeter()
    aux_loss = AverageMeter()
    test_acc = 0
    with torch.no_grad():
        for d in test_dataloader:
            images = d[0].to(device)
            labels = d[1].to(device)
            images = images.cuda()
            labels = labels.cuda()

            out_net = model(images)
            preds = out_net['y_hat']
            pred_labels = out_net['y_hat'].argmax(dim=1)
            test_acc += torch.sum(labels == pred_labels).item()

            out_criterion = criterion(out_net, images, preds, labels)

            aux_loss.update(model.aux_loss())
            bpp_loss.update(out_criterion["bpp_loss"])
            loss.update(out_criterion["loss"])
    test_acc = test_acc / 100
    print(
        f"Test epoch {epoch}: Average losses:"
        f'\tAcc: {test_acc:.4f} |'
        f"\tLoss: {loss.avg:.4f} |"
        f"\tBpp loss: {bpp_loss.avg:.4f} |"
        f'\tLog loss: {out_criterion["log_loss"].item():.4f} |'
        f"\tAux loss: {aux_loss.avg:.4f}\n"
    )

    return loss.avg, bpp_loss.avg, test_acc


def save_checkpoint(state, epoch, is_best, filename, best_filename):
    torch.save(state, filename)
    if is_best:
        shutil.copyfile(filename, best_filename)


### Main

In [9]:
def main(model, num_workers, batch_size, cuda, epoch, patch_size, learning_rate, lmbda):
    # args = parse_args(argv)

    # if args.seed is not None:
    #     torch.manual_seed(args.seed)
    #     random.seed(args.seed)

    class arguments:
      def __init__(self, model, num_workers, batch_size, cuda, epoch, patch_size, learning_rate, lmbda):
        self.model = model
        self.num_workers = num_workers
        self.batch_size = batch_size
        self.test_batch_size = 100
        self.cuda = cuda
        self.epochs = epoch
        self.patch_size = patch_size
        self.learning_rate = learning_rate
        self.aux_learning_rate = learning_rate
        self.lmbda = lmbda
        self.save = True
        self.seed = False
        self.clip_max_norm = 1.0
        self.checkpoint = False


    tr_mean = np.asarray([0.4914, 0.4822, 0.4465])
    tr_std = np.asarray([0.247, 0.243, 0.261])

    args = arguments(model, num_workers, batch_size, cuda, epoch, patch_size, learning_rate, lmbda)

    train_transforms = transforms.Compose(
        [transforms.Resize((64,64)), transforms.ToTensor(), transforms.RandomCrop(args.patch_size), torchvision.transforms.Normalize(tr_mean, tr_std)]
    )

    test_transforms = transforms.Compose(
        [transforms.Resize((64,64)), transforms.ToTensor(), transforms.CenterCrop(args.patch_size), torchvision.transforms.Normalize(tr_mean, tr_std)]
    )

    # train_dataset = ImageFolder(args.dataset, split="train", transform=train_transforms)
    # test_dataset = ImageFolder(args.dataset, split="test", transform=test_transforms)

    train_dataset = torchvision.datasets.CIFAR10('./CIFAR-10/',train=True,download=True, transform=train_transforms)
    test_dataset = torchvision.datasets.CIFAR10('./CIFAR-10/',train=False,download=True, transform=test_transforms)

    device = "cuda" if args.cuda and torch.cuda.is_available() else "cpu"

    train_dataloader = DataLoader(
        train_dataset,
        batch_size=args.batch_size,
        num_workers=args.num_workers,
        shuffle=True,
        pin_memory=(device == "cuda"),
    )
    test_dataloader = DataLoader(
        test_dataset,
        batch_size=args.test_batch_size,
        num_workers=args.num_workers,
        shuffle=False,
        pin_memory=(device == "cuda"),
    )


    ##########################################################################
    net = model
    resnet = torchvision.models.resnet18(pretrained = True)
    resnet.fc = nn.Linear(in_features=512, out_features=10, bias=True)

    class Net(nn.Module):
        def __init__(self, resnet, net):
            super(Net, self).__init__()

            self.g_a = net.g_a
            self.h_a = net.h_a
            self.g_s = net.g_s
            self.h_s = net.h_s
            self.entropy_bottleneck = net.entropy_bottleneck
            self.gaussian_conditional = net.gaussian_conditional
            self.res = resnet

        def forward(self, x):
            y = self.g_a(x)
            z = self.h_a(torch.abs(y))
            z_hat, z_likelihoods = self.entropy_bottleneck(z)
            scales_hat = self.h_s(z_hat)
            y_hat, y_likelihoods = self.gaussian_conditional(y, scales_hat)
            x_hat = self.g_s(y_hat)
            l_hat = self.res(x_hat)

            return {
                "x_hat": x_hat,
                "y_hat": l_hat,
                "likelihoods": {"y": y_likelihoods, "z": z_likelihoods},
            }


    net = Net(resnet, net)
    net.aux_loss = model.aux_loss
    net = net.to(device)
    ##########################################################################


    if args.cuda and torch.cuda.device_count() > 1:
        net = CustomDataParallel(net)

    optimizer, aux_optimizer = configure_optimizers(net, args)
    lr_scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, "min",factor=0.5)
    criterion = RateDistortionLoss(lmbda=args.lmbda)

    filename = str(args.lmbda) + '_check.pth.tar'
    best_filename = 'best' + filename

    last_epoch = 0
    if args.checkpoint:  # load from previous checkpoint
        print("Loading", args.checkpoint)
        checkpoint = torch.load(args.checkpoint, map_location=device)
        last_epoch = checkpoint["epoch"] + 1
        net.load_state_dict(checkpoint["state_dict"])
        optimizer.load_state_dict(checkpoint["optimizer"])
        aux_optimizer.load_state_dict(checkpoint["aux_optimizer"])
        lr_scheduler.load_state_dict(checkpoint["lr_scheduler"])

    best_loss = float("inf")
    for epoch in range(last_epoch, args.epochs):
        T11 = time.time()

        print(f"Learning rate: {optimizer.param_groups[0]['lr']}")
        train_one_epoch(
            net,
            criterion,
            train_dataloader,
            optimizer,
            aux_optimizer,
            epoch,
            args.clip_max_norm,
        )
        loss, bpp_loss, test_acc = test_epoch(epoch, test_dataloader, net, criterion)
        lr_scheduler.step(loss)
        T22 = time.time()
        print(f"Time: {T22-T11:.4f}")
        is_best = loss < best_loss
        best_loss = min(loss, best_loss)

        if args.save:
            save_checkpoint(
                {
                    "epoch": epoch,
                    "state_dict": net.state_dict(),
                    "loss": loss,
                    "bpp_loss": bpp_loss,
                    "acc": test_acc,
                    "optimizer": optimizer.state_dict(),
                    "aux_optimizer": aux_optimizer.state_dict(),
                    "lr_scheduler": lr_scheduler.state_dict(),
                },
                epoch,
                is_best,
                filename,
                best_filename,
            )


In [10]:
net = networks['bmshj2018-hyperprior']
net_out = main(net, 2, 64, 1, 20, 64, 0.001, 2.0)

Files already downloaded and verified
Files already downloaded and verified


Downloading: "https://download.pytorch.org/models/resnet18-f37072fd.pth" to /root/.cache/torch/hub/checkpoints/resnet18-f37072fd.pth


  0%|          | 0.00/44.7M [00:00<?, ?B/s]

Learning rate: 0.001

Train epoch 0: 	Acc: 41.3320 |
Test epoch 0: Average losses:	Acc: 50.2600 |	Loss: 2.8710 |	Bpp loss: 0.1158 |	Log loss: 1.2965 |	Aux loss: 459.7003

Time: 97.6951
Learning rate: 0.001

Train epoch 1: 	Acc: 59.9940 |
Test epoch 1: Average losses:	Acc: 60.4500 |	Loss: 2.3824 |	Bpp loss: 0.1280 |	Log loss: 0.9834 |	Aux loss: 335.8065

Time: 97.4023
Learning rate: 0.001

Train epoch 2: 	Acc: 67.6960 |
Test epoch 2: Average losses:	Acc: 66.2000 |	Loss: 2.0694 |	Bpp loss: 0.1394 |	Log loss: 0.9340 |	Aux loss: 289.8326

Time: 97.7346
Learning rate: 0.001

Train epoch 3: 	Acc: 72.6720 |
Test epoch 3: Average losses:	Acc: 69.6500 |	Loss: 1.9230 |	Bpp loss: 0.1489 |	Log loss: 0.9305 |	Aux loss: 241.9588

Time: 97.7139
Learning rate: 0.001

Train epoch 4: 	Acc: 76.6200 |
Test epoch 4: Average losses:	Acc: 69.1500 |	Loss: 2.0559 |	Bpp loss: 0.1577 |	Log loss: 0.9933 |	Aux loss: 215.6830

Time: 97.6818
Learning rate: 0.001

Train epoch 5: 	Acc: 80.1720 |
Test epoch 5: Average 

In [14]:
import os
os.getcwd()

'/content/MyDrive/MyDrive/DL_Project_HP'

## Data Prepration for Classification

In [11]:
train_transforms = transforms.Compose(
    [transforms.Resize((64,64)), transforms.RandomCrop(64), transforms.ToTensor()]
)

test_transforms = transforms.Compose(
    [transforms.Resize((64,64)), transforms.CenterCrop(64), transforms.ToTensor()]
)

# train_dataset = ImageFolder(args.dataset, split="train", transform=train_transforms)
# test_dataset = ImageFolder(args.dataset, split="test", transform=test_transforms)

train_dataset = torchvision.datasets.CIFAR10('./CIFAR-10/',train=True,download=True, transform=train_transforms)
test_dataset = torchvision.datasets.CIFAR10('./CIFAR-10/',train=False,download=True, transform=test_transforms)

Files already downloaded and verified
Files already downloaded and verified


In [None]:
checkpoint = torch.load('/content/MyDrive/MyDrive/DL_Project_HP/best2.0_check.pth.tar', map_location=device)
net.load_state_dict(checkpoint["state_dict"])
net.to('cuda');

In [None]:
train_dataloader = DataLoader(
    train_dataset,
    batch_size=64,
    num_workers=2,
    shuffle=True,
    pin_memory=(device == "cuda"),
)

test_dataloader = DataLoader(
    test_dataset,
    batch_size=64,
    num_workers=2,
    shuffle=False,
    pin_memory=(device == "cuda"),
)

## ResNet

In [None]:
resnet = torchvision.models.resnet18(pretrained=True)
resnet.fc = nn.Linear(in_features=512, out_features=10, bias=True)
resnet.to('cuda')
Loss = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(resnet.parameters(), lr=0.001)
lr_scheduler = optim.lr_scheduler.ReduceLROnPlateau(optimizer, "min")

In [None]:
Nepoch = 15
for epoch in range(Nepoch): 
    train_loss = 0.0
    test_loss = 0.0
    t1 = time.time()
    train_acc = 0.0
    test_acc = 0.0

    for i, data in enumerate(train_dataloader):
        images, labels = data
        images = images.cuda()
        ic_out = net(images)
        images = ic_out["x_hat"]
        labels = labels.cuda()
        optimizer.zero_grad()
        predicted_output = resnet(images)
        fit = Loss(predicted_output,labels)
        fit.backward()
        optimizer.step()   
        train_loss += fit.item()
        train_acc += torch.sum(labels == predicted_output.argmax(dim=1)).item()

    for i, data in enumerate(test_dataloader):
        with torch.no_grad():
            images, labels = data
            images = images.cuda()
            labels = labels.cuda()
            ic_out = net(images)
            images = ic_out["x_hat"]
            labels = labels.cuda()
            predicted_output = resnet(images)
            fit = Loss(predicted_output,labels)
            test_loss += fit.item()
            test_acc += torch.sum(labels == predicted_output.argmax(dim=1)).item()

    train_loss = train_loss/len(train_dataset)
    test_loss = test_loss/len(test_dataset)
    train_acc = train_acc/len(train_dataset)
    test_acc = test_acc/len(test_dataset)
    t2 = time.time()

    print(f'Epoch: {epoch} \tTrain Loss: {train_loss:.5f} \tTrain Acc: {train_acc:.4f} \tTest Loss: {test_loss:.5f} \tTest Acc: {test_acc:.4f} \tTime: {t2-t1:.4f}')