In [None]:
import torch
import torch.optim as optim
import torch.utils.data as data
import torch.nn as nn
import torch.nn.functional as F
import numpy as np
from tqdm import trange, tqdm_notebook
import copy
from torch.distributions.uniform import Uniform
from torch.distributions.normal import Normal
import matplotlib.pyplot as plt
from scipy.stats import norm
from scipy.linalg import sqrtm
from torchvision import models
from torchvision import transforms
from PIL import Image

In [None]:
class I(nn.Module):
  """Feature extractor built on the torch.hub pretrained Inception v3.

  The wrapped network is put in eval mode at construction time. `forward`
  returns the activations of the network's `avgpool` layer rather than the
  classification logits.
  """

  def __init__(self):
    super().__init__()
    # Downloads the repo/weights on first use (cached by torch.hub afterwards).
    self.model = torch.hub.load('pytorch/vision:v0.10.0', 'inception_v3', pretrained=True)
    self.model.eval()

  def forward(self, x):
    """Run `x` through the network and return the `avgpool` activations.

    Args:
      x: image batch accepted by the wrapped model
        (presumably (N, 3, H, W) floats -- confirm preprocessing with caller).

    Returns:
      Detached tensor holding the `avgpool` output with dimensions 3 and 2
      squeezed away, i.e. (N, C) when the pooled map is 1x1 (2048 features
      according to the thread linked below).
    """
    #https://discuss.pytorch.org/t/extract-the-2048-vector-of-a-fine-tuned-inception-v3-on-test-set/152510/4
    captured = {}

    def hook(module, inputs, output):
      captured['avgpool'] = output.detach()

    # Register the hook for this call only. Registering without removing it
    # would add one more hook to `avgpool` on every forward pass.
    handle = self.model.avgpool.register_forward_hook(hook)
    try:
      self.model(x)
    finally:
      handle.remove()

    return captured['avgpool'].squeeze(3).squeeze(2)


In [None]:
class FID(nn.Module):
  """Frechet Inception Distance between two batches of images.

  Both batches are embedded with the `I` feature extractor; the distance is
  then computed between Gaussians fitted to the two feature sets:

      FID = ||mu_x - mu_y||^2 + Tr(S_x + S_y - 2 * (S_x S_y)^(1/2))
  """

  def __init__(self):
    super().__init__()
    self.inception = I()

  def forward(self, x, y):
    """Compute the FID between image batches `x` and `y`.

    Args:
      x: first image batch, passed unchanged to the feature extractor.
      y: second image batch, passed unchanged to the feature extractor.
        Each batch needs at least two samples for the covariance estimate.

    Returns:
      The FID as a NumPy floating-point scalar (non-negative up to numerical
      error; approximately 0 for identical feature distributions).
    """
    with torch.no_grad():
      features_x = self.inception(x).detach().cpu().numpy()
      features_y = self.inception(y).detach().cpu().numpy()

    # Squared distance between the feature means.
    mean_diff = features_x.mean(axis=0) - features_y.mean(axis=0)
    mu_part = np.dot(mean_diff, mean_diff)

    # rowvar=False: rows are samples, columns are feature dimensions.
    covariance_x = np.cov(features_x, rowvar=False)
    covariance_y = np.cov(features_y, rowvar=False)

    covmean = sqrtm(np.dot(covariance_x, covariance_y))
    if not np.isfinite(covmean).all():
      # Near-singular product: retry with a small ridge on both covariances.
      offset = np.eye(covariance_x.shape[0]) * 1e-6
      covmean = sqrtm(np.dot(covariance_x + offset, covariance_y + offset))
    # sqrtm may return a complex array with tiny imaginary parts; keep the real part.
    covmean = covmean.real

    trace = np.trace(covariance_x) + np.trace(covariance_y) - 2 * np.trace(covmean)

    # The trace term is ADDED to the mean term (it was subtracted before,
    # which could yield negative "distances").
    return mu_part + trace


In [None]:
def _load_image_batch(paths):
  """Load the image files in `paths` and stack them into one (len(paths), 3, H, W) tensor."""
  to_tensor = transforms.ToTensor()
  tensors = []
  for path in paths:
    # `with` closes the underlying file handle once the pixels are converted.
    with Image.open(path) as img:
      # convert("RGB") makes the 3-channel layout explicit (grayscale files
      # are replicated across the three channels).
      tensors.append(to_tensor(img.convert("RGB")))
  # torch.stack requires every image to have the same height and width.
  return torch.stack(tensors)


def fid_experiment(generated_pattern="exp13/{}.jpg", truth_pattern="truth_sketch_{}.jpg",
                   sample_number_1=70, sample_number_2=70, device=None):
  """Compute the FID between a set of generated images and a set of ground-truth images.

  Args:
    generated_pattern: format string for generated image paths; `{}` is
      replaced by the sample index 0..sample_number_1-1.
    truth_pattern: format string for ground-truth image paths; `{}` is
      replaced by the sample index 0..sample_number_2-1.
    sample_number_1: number of generated images to load.
    sample_number_2: number of ground-truth images to load.
    device: torch device to run on; defaults to CUDA when available, else CPU.

  Returns:
    The value returned by `FID.forward` for the two image batches.
  """
  if device is None:
    device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

  inputs1 = _load_image_batch(
      [generated_pattern.format(i) for i in range(sample_number_1)]).to(device)
  inputs2 = _load_image_batch(
      [truth_pattern.format(i) for i in range(sample_number_2)]).to(device)

  fid = FID().to(device)
  fid_val = fid(inputs1, inputs2)

  return fid_val


In [None]:
# Run the FID experiment defined above; the returned value is shown as the cell output.
fid_experiment()

Downloading: "https://github.com/pytorch/vision/archive/v0.10.0.zip" to /root/.cache/torch/hub/v0.10.0.zip
Downloading: "https://download.pytorch.org/models/inception_v3_google-0cc3c7bd.pth" to /root/.cache/torch/hub/checkpoints/inception_v3_google-0cc3c7bd.pth


  0%|          | 0.00/104M [00:00<?, ?B/s]

44.804162487089286

In [None]:
!pip install face_recognition
#https://github.com/ageitgey/face_recognition

Looking in indexes: https://pypi.org/simple, https://us-python.pkg.dev/colab-wheels/public/simple/
Collecting face_recognition
  Downloading face_recognition-1.3.0-py2.py3-none-any.whl (15 kB)
Collecting face-recognition-models>=0.3.0
  Downloading face_recognition_models-0.3.0.tar.gz (100.1 MB)
[K     |████████████████████████████████| 100.1 MB 27 kB/s 
Building wheels for collected packages: face-recognition-models
  Building wheel for face-recognition-models (setup.py) ... [?25l[?25hdone
  Created wheel for face-recognition-models: filename=face_recognition_models-0.3.0-py2.py3-none-any.whl size=100566186 sha256=cba380b1b21f7a3974ddab1d1c4f5271acd1d72802c6fd7548d9f5dda62b6b7d
  Stored in directory: /root/.cache/pip/wheels/d6/81/3c/884bcd5e1c120ff548d57c2ecc9ebf3281c9a6f7c0e7e7947a
Successfully built face-recognition-models
Installing collected packages: face-recognition-models, face-recognition
Successfully installed face-recognition-1.3.0 face-recognition-models-0.3.0


In [None]:
import face_recognition

def face_recognition_experiment(sample_number=70, known_pattern="exp13/{}.jpg", test_pattern="{}.jpg"):
  """Measure how often a test image is matched to exactly its own known image.

  It is assumed that known sample i corresponds to test sample i.

  Args:
    sample_number: number of sample pairs (indices 0..sample_number-1).
    known_pattern: format string for the known image paths (`{}` = index).
    test_pattern: format string for the test image paths (`{}` = index).

  Returns:
    Fraction of the `sample_number` pairs for which `compare_faces` reports a
    match with the corresponding known face and with no other known face.
    Pairs where no face is detected in either image count as failures.

  Raises:
    ValueError: if `sample_number` is not positive.
  """
  if sample_number <= 0:
    raise ValueError("sample_number must be positive")

  known_faces = []
  kept_indices = []  # file indices whose known image contains a detectable face
  for i in range(sample_number):
    image = face_recognition.load_image_file(known_pattern.format(i))
    # Encode once and reuse; the encoding step is the expensive part.
    encodings = face_recognition.face_encodings(image)
    if len(encodings) > 0:
      known_faces.append(encodings[0])
      kept_indices.append(i)

  number_of_accurates = 0
  # `position` is the index of this sample inside `known_faces`.
  for position, file_i in enumerate(kept_indices):
    unknown_image = face_recognition.load_image_file(test_pattern.format(file_i))
    unknown_encodings = face_recognition.face_encodings(unknown_image)
    if len(unknown_encodings) == 0:
      # No face detected in the test image: count as a miss instead of
      # failing with IndexError.
      continue
    results = face_recognition.compare_faces(known_faces, unknown_encodings[0])

    # Accurate only if the sole match is the sample's own known face.
    if all(bool(match) == (j == position) for j, match in enumerate(results)):
      number_of_accurates += 1

  return number_of_accurates / sample_number


In [None]:
# Run the face-recognition experiment defined above; the returned fraction is shown as the cell output.
face_recognition_experiment()

0.5714285714285714