In [60]:
import torch
import torch.nn as nn
import torchvision
import torchvision.transforms as transforms
import os
from tqdm import tqdm
from pylab import *

In [61]:

# Device configuration: use CUDA when a GPU is visible, otherwise the CPU.
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# Hyper-parameters
input_size, hidden_size, num_classes = 784, 500, 10
num_epochs, batch_size, learning_rate = 15, 100, 0.001

# KMNIST dataset; only the training split is constructed with download=True.
train_dataset = torchvision.datasets.KMNIST(
    root='../../data', train=True, transform=transforms.ToTensor(), download=True
)
test_dataset = torchvision.datasets.KMNIST(
    root='../../data', train=False, transform=transforms.ToTensor()
)

# Data loaders: training batches are shuffled, test batches keep dataset order.
train_loader = torch.utils.data.DataLoader(
    dataset=train_dataset, batch_size=batch_size, shuffle=True
)
test_loader = torch.utils.data.DataLoader(
    dataset=test_dataset, batch_size=batch_size, shuffle=False
)



In [None]:
class NeuralNet(nn.Module):
    """Fully connected classifier: Linear -> ReLU -> Linear."""

    def __init__(self, input_size, hidden_size, num_classes):
        super().__init__()
        # Attribute names (fc1, relu, fc2) define the state_dict keys.
        self.fc1 = nn.Linear(input_size, hidden_size)
        self.relu = nn.ReLU()
        self.fc2 = nn.Linear(hidden_size, num_classes)

    def forward(self, x):
        """Return the output of fc2 applied to the ReLU-activated fc1 output."""
        hidden = self.relu(self.fc1(x))
        return self.fc2(hidden)
    
# Build the fully connected baseline and place it on the selected device.
model = NeuralNet(input_size, hidden_size, num_classes).to(device)

# Loss and optimiser for the baseline network.
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)

In [62]:

class Kuzushiji(nn.Module):
    """
    Convolutional classifier for batches of 1x28x28 images.

    Three Conv -> BatchNorm (-> MaxPool) -> ReLU stages feed a 512-unit
    hidden layer and a 10-way softmax head.

    forward(x) returns a tuple ``(out, x)``:
      * ``out`` -- (batch, 10) softmax probabilities,
      * ``x``   -- (batch, 512) hidden activations after dropout.
    """
    def __init__(self):
        super(Kuzushiji, self).__init__()
        # A 2-tuple pads only the last (width) dimension: 28x28 -> 28x32.
        # fc1's in_features=768 (128 channels * 2 * 3) depends on this shape.
        self.pad1 = nn.ZeroPad2d((2, 2))

        self.layer1 = nn.Sequential(
            nn.Conv2d(in_channels=1, out_channels=32, kernel_size=(7, 7), stride=(1, 1), bias=False),
            nn.BatchNorm2d(num_features=32),
            nn.MaxPool2d(kernel_size=(2, 2)),
            nn.ReLU()
        )

        self.layer2 = nn.Sequential(
            nn.Conv2d(in_channels=32, out_channels=64, kernel_size=(5, 5), stride=(1, 1), bias=False),
            nn.BatchNorm2d(num_features=64),
            nn.ReLU()
        )

        self.layer3 = nn.Sequential(
            nn.Conv2d(in_channels=64, out_channels=128, kernel_size=(3, 3), stride=(1, 1), bias=False),
            nn.BatchNorm2d(num_features=128),
            nn.MaxPool2d(kernel_size=(2, 2)),
            nn.ReLU()
        )

        self.fc1 = nn.Sequential(
            nn.Linear(in_features=768, out_features=512),
            nn.ReLU()
        )
        self.dropout1 = nn.Dropout(p=0.2)

        self.fc2 = nn.Sequential(
            nn.Linear(in_features=512, out_features=10),
            # dim=1 is the class axis of the (batch, 10) input; leaving it
            # implicit is deprecated and emits a warning on every forward pass.
            # NOTE(review): nn.CrossEntropyLoss already applies log-softmax, so
            # training on these probabilities applies softmax twice -- confirm
            # whether the head should emit raw logits instead.
            nn.Softmax(dim=1)
        )

    def forward(self, x):
        """Run the network; return (class probabilities, 512-d hidden features)."""
        x = self.pad1(x)
        x = self.layer1(x)
        x = self.layer2(x)
        x = self.layer3(x)
        # Flatten every sample to a vector before the dense layers.
        x = x.reshape(x.shape[0], -1)
        x = self.fc1(x)
        x = self.dropout1(x)
        out = self.fc2(x)

        return out, x

In [63]:
# Convolutional classifier under attack, plus its loss and optimiser.
my_model = Kuzushiji().to(device)
criterion = nn.CrossEntropyLoss()
optimizer = torch.optim.Adam(my_model.parameters(), lr=learning_rate)

RuntimeError: CUDA error: device-side assert triggered

In [None]:
# Train the model
total_step = len(train_loader)
for epoch in range(num_epochs):
    for i, (images, labels) in enumerate(train_loader):
        # Put the batch on the configured device in NCHW layout.
        images = images.reshape(-1, 1, 28, 28).to(device)
        labels = labels.to(device)

        # Forward pass: element 0 of the model output holds the class scores.
        outputs = my_model(images)[0]
        loss = criterion(outputs, labels)

        # Backward pass and parameter update.
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # Report the current batch loss every 100 steps.
        if (i + 1) % 100 != 0:
            continue
        print ('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}'
               .format(epoch+1, num_epochs, i+1, total_step, loss.item()))

In [None]:
# Normal Model Testing
# The classifier contains Dropout and BatchNorm layers, so it must be switched
# to inference mode; otherwise dropout stays active and batch statistics are
# used, which makes the reported accuracy noisy.
my_model.eval()
with torch.no_grad():
    correct = 0
    total = 0
    for images, labels in test_loader:
        images = images.reshape(-1, 1, 28, 28).to(device)
        labels = labels.to(device)
        # Element 0 of the model output holds the class scores.
        outputs = my_model(images)[0]
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

    print('Accuracy of the network on the 10000 test images: {} %'.format(100 * correct / total))

# FGSM Analysis

In [None]:
# Freeze the classifier weights: the attacks below only need input gradients.
for param in my_model.parameters():
    param.requires_grad = False

# Targeted FGSM attack 

In [None]:
# Targeted FGSM: move every test image one signed-gradient step *down* the
# loss computed against a shifted target class, then re-score the classifier
# against the true labels.

#epsilon=[0.0001,0.0003,0.001,0.003,0.1,0.2,0.3,0.4,0.5]
pred_list = []
epsilon = [0.3]

for value in epsilon:
    pred_val_list = []
    for k in range(2, 3):
        l_tfgsm = []
        sign = []
        for i, (images, labels) in enumerate(test_loader):
            # Fresh leaf tensor so the gradient w.r.t. the input can be read back.
            copyOf_images = images.clone().detach().reshape(-1, 1, 28, 28).to(device)
            copyOf_images.requires_grad = True
            # Target is the true label shifted by k, wrapped into the 10 classes.
            target_class = ((labels + k) % 10).to(device)

            # Forward pass
            outputs = my_model(copyOf_images)[0]
            loss = criterion(outputs, target_class)

            # Backward pass; only the input gradient is used afterwards.
            optimizer.zero_grad()
            loss.backward()
            c = copyOf_images.grad.sign()
            copyOf_images = torch.clamp(copyOf_images - (value * c), 0, 1)
            sign.append(c)
            l_tfgsm.append((copyOf_images, images, labels))

        with torch.no_grad():
            correct = 0
            total = 0
            for images, trueimages, labels in l_tfgsm:
                images = images.reshape(-1, 1, 28, 28).to(device)
                labels = labels.to(device)
                outputs = my_model(images)[0]
                _, predicted = torch.max(outputs.data, 1)
                total += labels.size(0)
                correct += (predicted == labels).sum().item()
            pred_val_list.append(100 * correct / total)
            print("accuracy of the network on the 10000 test images for epsilon value {}:{} %".format(value, 100 * correct / total))
    pred_list.append(pred_val_list)

In [None]:
# Print the accuracy table from the targeted-FGSM sweep, then plot one column of it.
print(pred_list)

import matplotlib.pyplot as plt

make_list=[]
# NOTE(review): plt.plot needs one accuracy per epsilon listed here, but the sweep
# cell as written assigns epsilon=[0.3], so pred_list has a single row -- confirm
# which sweep this plot is meant to show.
epsilon=[0.0001,0.0003,0.001,0.003,0.1,0.2,0.3,0.4,0.5]

for k in pred_list:
    # Index 2 picks the third accuracy stored for each epsilon.
    # NOTE(review): the sweep cell as written loops k over range(2,3) and stores
    # only one value per epsilon, so index 2 would be out of range -- verify.
    make_list.append(k[2])
plt.plot(epsilon,make_list)
plt.xlabel("Epsilon Value")
plt.ylabel("Accuracy(in %)")
plt.title("Targeted FGSM on Kuzushiji where Target labels =(True label+2)%10")
plt.show()

In [None]:
# Untargeted FGSM attack
# For every epsilon, move each test image one signed-gradient step *up* the
# loss computed against its true label, then re-score the classifier.
l = []
sign = []
actual = []
epsilon = [0.0001, 0.0003, 0.001, 0.003, 0.1, 0.2, 0.3, 0.4, 0.5]

for value in epsilon:
    # Start from empty lists so each epsilon is scored on its own examples.
    l = []
    sign = []
    for i, (images, labels) in enumerate(test_loader):
        copyOf_images = images.clone().detach()
        copyOf_images = copyOf_images.reshape(-1, 1, 28, 28).to(device)
        copyOf_images.requires_grad = True
        target_class = labels.to(device)

        # Forward pass. my_model returns (class scores, hidden features); the
        # loss must be computed on the scores only, hence the [0].
        outputs = my_model(copyOf_images)[0]
        loss = criterion(outputs, target_class)

        # Backward pass; only the gradient w.r.t. the input is used.
        optimizer.zero_grad()
        loss.backward()
        c = copyOf_images.grad.sign()
        copyOf_images = copyOf_images + (value * c)
        copyOf_images = torch.clamp(copyOf_images, 0, 1)
        sign.append(c)
        l.append((copyOf_images, labels))

    with torch.no_grad():
        correct = 0
        total = 0
        for images, labels in l:
            images = images.reshape(-1, 1, 28, 28).to(device)
            labels = labels.to(device)
            outputs = my_model(images)[0]
            _, predicted = torch.max(outputs.data, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()
        print("accuracy of the network on the 10000 test images for epsilon value {}:{} %".format(value, 100 * correct / total))

In [None]:
# Re-check the accuracy on the adversarial (images, labels) batches held in `l`.

with torch.no_grad():
    correct = 0
    total = 0
    for images, labels in l:
        images = images.reshape(-1, 1, 28, 28).to(device)
        labels = labels.to(device)
        # my_model returns (class scores, hidden features); take the scores.
        outputs = my_model(images)[0]
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
    print("accuracy of the network on the 10000 test images:{} %".format(100 * correct / total))

In [None]:
def to_var(x, requires_grad=False, volatile=False):
    """
    Move a tensor to the GPU when CUDA is available and set its gradient flag.

    Args:
        x: tensor to wrap.
        requires_grad: whether the returned tensor should record gradients.
        volatile: accepted for backward compatibility only and ignored;
            use ``torch.no_grad()`` to disable gradient tracking instead.

    Returns:
        A leaf tensor holding the same values as ``x`` (on the GPU when one
        is available) with ``requires_grad`` set as requested.
    """
    if torch.cuda.is_available():
        x = x.cuda()
    # Plain tensors replace the deprecated autograd.Variable wrapper; detach()
    # guarantees a leaf so that .grad is populated after backward().
    return x.detach().requires_grad_(requires_grad)

In [None]:
#PGD Attack 

class LinfPGDAttack(nn.Module):
    """
    Iterative signed-gradient attack bounded by an L-infinity ball.

    Attributes:
        model: network under attack; its output is indexed with [0].
        epsilon: radius of the allowed perturbation around the clean input.
        k: number of gradient steps.
        a: size of each step.
        randn: when true, start from a uniformly random point in the ball.
        loss_fn: cross-entropy loss evaluated against the supplied labels.
    """

    def __init__(self, model=None, epsilon=0.3, k=40, a=0.01, random_start=True):
        super().__init__()
        self.model = model
        self.epsilon = epsilon
        self.k = k
        self.a = a
        self.randn = random_start
        self.loss_fn = nn.CrossEntropyLoss()

    def perturb(self, X_nat, y):
        """
        Return a perturbed copy of the numpy batch ``X_nat``.

        Each step moves *down* the loss computed against ``y`` and then
        projects back into the epsilon ball and the [0, 1] pixel range.
        """
        if not self.randn:
            X = np.copy(X_nat)
        else:
            noise = np.random.uniform(-self.epsilon, self.epsilon, X_nat.shape)
            X = X_nat + noise.astype('float32')

        for _ in range(self.k):
            X_var = to_var(torch.from_numpy(X), requires_grad=True)
            y_var = to_var(torch.LongTensor(y))

            loss = self.loss_fn(self.model(X_var)[0], y_var)
            loss.backward()
            grad = X_var.grad.data.cpu().numpy()

            # Signed descent step, then projection onto the feasible set.
            X -= self.a * np.sign(grad)
            X = np.clip(
                np.clip(X, X_nat - self.epsilon, X_nat + self.epsilon),
                0,
                1,
            )

        return X

In [None]:
from torch.autograd import Variable

# Targeted PGD sweep over the perturbation radius epsilon.
#perturbed_images=[]
epsilon = [0.001, 0.003, 0.01, 0.03, 0.1, 0.2, 0.3, 0.4, 0.5]
tmp_list = []
l = []

for value in epsilon:
    # One attack object per epsilon (it does not depend on the batch).
    PGDobj = LinfPGDAttack(model=my_model, random_start=False, epsilon=value)
    # Reset the example list so this epsilon's accuracy is not mixed with
    # adversarial batches produced for the previous epsilon values.
    l = []
    for i, (images, labels) in enumerate(test_loader):
        target = (labels + 1) % 10  # generating the target
        Changed_Images = PGDobj.perturb(images.numpy(), target.numpy())
        if np.array_equal(Changed_Images, images.numpy()):
            print("No change")
            break
        l.append((torch.from_numpy(Changed_Images), labels))
        if i % 50 == 0:
            print("Now adding changed images in {}th iteration".format(i))

    with torch.no_grad():
        correct = 0
        total = 0
        for images, labels in l:
            images = images.reshape(-1, 1, 28, 28).to(device)
            labels = labels.to(device)
            outputs = my_model(images)[0]
            _, predicted = torch.max(outputs.data, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()
        # No batch may have been stored if the attack left the first batch unchanged.
        accuracy = 100 * correct / total if total else float('nan')
        tmp_list.append(accuracy)
        print("accuracy of the network on the 10000 test images:{} %".format(accuracy))

In [None]:
from torch.autograd import Variable

# Targeted PGD sweep over the per-step size `a` (epsilon stays at its default).
#perturbed_images=[]
a = [0.001, 0.003, 0.01, 0.03, 0.1, 0.2, 0.3, 0.4, 0.5]
tmp_list = []
l = []

# Iterate over the step sizes defined in this cell, not over the `epsilon`
# list left behind by an earlier cell.
for value in a:
    PGDobj = LinfPGDAttack(model=my_model, random_start=False, a=value)
    # Reset so each step size is scored only on its own adversarial batches.
    l = []
    for i, (images, labels) in enumerate(test_loader):
        target = (labels + 1) % 10  # generating the target
        Changed_Images = PGDobj.perturb(images.numpy(), target.numpy())
        if np.array_equal(Changed_Images, images.numpy()):
            print("No change")
            break
        l.append((torch.from_numpy(Changed_Images), labels))
        if i % 50 == 0:
            print("Now adding changed images in {}th iteration".format(i))

    with torch.no_grad():
        correct = 0
        total = 0
        for images, labels in l:
            images = images.reshape(-1, 1, 28, 28).to(device)
            labels = labels.to(device)
            # my_model returns (class scores, hidden features); take the scores.
            outputs = my_model(images)[0]
            _, predicted = torch.max(outputs.data, 1)
            total += labels.size(0)
            correct += (predicted == labels).sum().item()
        # No batch may have been stored if the attack left the first batch unchanged.
        accuracy = 100 * correct / total if total else float('nan')
        tmp_list.append(accuracy)
        print("accuracy of the network on the 10000 test images:{} %".format(accuracy))

In [None]:
import matplotlib.pyplot as plt

# Accuracy as a function of the PGD step size.
plt.plot(
    a,
    tmp_list,
)
plt.title("Targeted PGD over Kuzushiji")
plt.ylabel("Accuracy")
plt.xlabel("Value of One Step of Gradient Descent")

In [None]:
# Re-check the accuracy on the adversarial (images, labels) batches held in `l`.
with torch.no_grad():
    correct = 0
    total = 0
    for images, labels in l:
        images = images.reshape(-1, 1, 28, 28).to(device)
        labels = labels.to(device)
        # my_model returns (class scores, hidden features); take the scores.
        outputs = my_model(images)[0]
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

    print("accuracy of the network on the 10000 test images:{} %".format(100 * correct / total))

# Carlini Wagner Attack

In [None]:
# CW-L2 Attack
# Based on the paper, i.e. not exact same version of the code on https://github.com/carlini/nn_robust_attacks
# (1) Binary search method for c, (2) Optimization on tanh space, (3) Choosing method best l2 adversaries is NOT IN THIS CODE.
def cw_l2_attack(model, images, labels, targeted=False, c=1e-4, kappa=0, max_iter=200, learning_rate=0.01) :
    """
    Craft adversarial images by minimising ``MSE(a, images) + c * f(a)`` with Adam.

    The candidate image is parameterised as ``a = (tanh(w) + 1) / 2`` so it
    always lies in [0, 1]; ``w`` starts at zero.

    Args:
        model: callable whose output is indexed with [1] inside ``f``.
        images: clean input batch.
        labels: class indices; the class to reach when ``targeted`` is true,
            otherwise the class to move away from.
        targeted: selects the sign of the margin term.
        c: weight of the margin term relative to the L2 distance.
        kappa: confidence margin; the margin term is clamped at ``-kappa``.
        max_iter: number of optimisation steps.
        learning_rate: Adam step size.

    Returns:
        Tensor of adversarial images with the same shape as ``images``.
    """

    images = images.to(device)
    labels = labels.to(device)

    # Define f-function
    def f(x) :

        outputs = model(x)[1]  #taking penultimate layer in this case rather than the softmax layer
        # NOTE(review): for the Kuzushiji model defined in this notebook, element [1]
        # is the 512-d hidden activation rather than per-class scores, so the
        # one-hot mask below spans 512 columns -- confirm this is intended.
        # Build the mask on the same device as `labels`, which is used to index it.
        one_hot_labels = torch.eye(len(outputs[0]), device=labels.device)[labels]

        i, _ = torch.max((1-one_hot_labels)*outputs, dim=1)
        # masked_select needs a boolean mask; uint8 masks are deprecated.
        j = torch.masked_select(outputs, one_hot_labels.bool())

        # If targeted, optimize for making the labelled class the most likely
        if targeted :
            return torch.clamp(i-j, min=-kappa)

        # If untargeted, optimize for making some other class the most likely
        else :
            return torch.clamp(j-i, min=-kappa)

    # `images` already lives on `device`, so this is a leaf tensor Adam can optimise.
    w = torch.zeros_like(images, requires_grad=True)

    optimizer = torch.optim.Adam([w], lr=learning_rate)

    prev = 1e10
    # Check for early stopping ten times per run; at least every step so that
    # max_iter < 10 does not lead to a modulo-by-zero.
    check_every = max(1, max_iter // 10)

    for step in tqdm(range(max_iter)) :

        a = 1/2*(nn.Tanh()(w) + 1)

        loss1 = nn.MSELoss(reduction='sum')(a, images)
        loss2 = torch.sum(c*f(a))

        cost = loss1 + loss2

        optimizer.zero_grad()
        cost.backward()
        optimizer.step()

        # Early stop when the cost has increased since the previous checkpoint.
        if step % check_every == 0 :
            cost_value = cost.item()
            if cost_value > prev :
                print('Attack Stopped due to CONVERGENCE....')
                return a
            prev = cost_value

        print('- Learning Progress : %2.2f %%        ' %((step+1)/max_iter*100), end='\r')

    attack_images = 1/2*(nn.Tanh()(w) + 1)

    return attack_images

In [None]:
print("Attack Image & Predicted Label")

# Run the targeted Carlini-Wagner attack on the first 20 test batches for every
# value of c in `options` and record the accuracy against the true labels.
#kappa=[0.01,0.03,1,3,5,7,9]
#options=[0.01,0.03,0.1,0.2,0.3,0.4,0.5]
options = [0.5]
tmp_list = []
l = []
for value in options:
    correct = 0
    total = 0
    for i, (images, labels) in enumerate(test_loader):
        if i >= 20:
            break
        # A targeted attack must be given the class to reach. Passing the true
        # labels with targeted=True would push the images *towards* the correct
        # class instead of away from it.
        target = (labels + 2) % 10
        images_ = cw_l2_attack(my_model, images, target, targeted=True, c=value, kappa=5)
        # Drop the optimisation graph before storing the adversarial batch.
        images_ = images_.detach()
        labels = labels.to(device)
        with torch.no_grad():
            outputs = my_model(images_)[0]

        _, pre = torch.max(outputs.data, 1)
        l.append((images_, images, labels))
        total += labels.size(0)
        correct += (pre == labels).sum().item()

        #imshow(torchvision.utils.make_grid(images.cpu().data, normalize=True), [normal_data.classes[i] for i in pre])
    tmp_list.append(100 * float(correct) / total)
    print('Accuracy of test text: %f %%' % (100 * float(correct) / total))

In [None]:
# Inspect the array shape numpy infers for the stored tuples in `l`.
# NOTE(review): the entries of `l` are tuples of torch tensors; confirm np.asarray can convert them.
np.asarray(l).shape

In [None]:
# Print the accuracies collected by the Carlini-Wagner sweep, then plot them.
print(tmp_list)

import matplotlib.pyplot as plt
plt.title("Targeted L2 Carlini Wagner Attack on Kuzushiji")
plt.xlabel("Different k values keeping c=0.3,learning_rate=0.01,num_iters=200")
plt.ylabel("Accuracy")
# NOTE(review): `kappa_list` is not assigned anywhere in the visible notebook --
# presumably the list of kappa values that was swept; define it before running.
plt.plot(kappa_list,tmp_list)

In [None]:
# Display the accuracies recorded by the most recent sweep.
tmp_list

In [None]:
# Plot accuracy against the values of c stored in `options`.
# NOTE(review): not being the last expression of the cell, this bare name displays nothing.
tmp_list

import matplotlib.pyplot as plt
plt.title("Targeted L2 Carlini Wagner Attack on Kuzushiji")
plt.xlabel("Different c values keeping k=5,learning_rate=0.01,num_iters=200")
plt.ylabel("Accuracy")
# `options` and `tmp_list` must have the same length for this call to succeed.
plt.plot(options,tmp_list)

In [None]:
import torch
import torch.nn as nn
import torch.nn.functional as F
import torchvision
from torchvision import transforms
from torchvision.utils import save_image

In [None]:

# Device configuration
device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')

# Create the sample directory; exist_ok avoids the check-then-create race and
# makes the cell safe to re-run.
sample_dir = 'samples'
os.makedirs(sample_dir, exist_ok=True)

# Hyper-parameters
# Note: num_epochs, batch_size and learning_rate replace the values that were
# set for the classifier earlier in the notebook.
image_size = 784
h_dim = 400
z_dim = 60
num_epochs = 20
batch_size = 64
learning_rate = 2e-3

# KMNIST training split used to fit the VAE
dataset = torchvision.datasets.KMNIST(root='../../data',
                                     train=True,
                                     transform=transforms.ToTensor(),
                                     download=True)

# Data loader
data_loader = torch.utils.data.DataLoader(dataset=dataset,
                                          batch_size=batch_size,
                                          shuffle=True)


# VAE model
class VAE(nn.Module):
    """
    Fully connected variational auto-encoder.

    The encoder maps image_size -> 500 -> 300 -> 150 and emits two z_dim-wide
    heads (fc4: mean, fc41: log-variance); the decoder mirrors it back to
    image_size and ends in a sigmoid. ``h_dim`` is accepted but not used.
    """

    def __init__(self, image_size=784, h_dim=400, z_dim=60):
        super().__init__()
        # Encoder
        self.fc1 = nn.Linear(image_size, 500)
        self.fc2 = nn.Linear(500, 300)
        self.fc3 = nn.Linear(300, 150)
        self.fc4 = nn.Linear(150, z_dim)
        self.fc41 = nn.Linear(150, z_dim)
        # Decoder
        self.fc5 = nn.Linear(z_dim, 150)
        self.fc6 = nn.Linear(150, 300)
        self.fc7 = nn.Linear(300, 500)
        self.fc8 = nn.Linear(500, image_size)

    def encode(self, x):
        """Return the (mean, log-variance) pair for a batch of flat images."""
        h = x
        for layer in (self.fc1, self.fc2, self.fc3):
            h = F.relu(layer(h))
        return self.fc4(h), self.fc41(h)

    def reparameterize(self, mu, log_var):
        """Sample z = mu + eps * std, with eps drawn from a standard normal."""
        std = torch.exp(log_var / 2)
        return mu + torch.randn_like(std) * std

    def decode(self, z):
        """Map latent vectors back to pixel intensities in (0, 1)."""
        h = z
        for layer in (self.fc5, self.fc6, self.fc7):
            h = F.relu(layer(h))
        return F.sigmoid(self.fc8(h))

    def forward(self, x):
        """Encode, sample, decode; return (reconstruction, mu, log_var)."""
        mu, log_var = self.encode(x)
        x_reconst = self.decode(self.reparameterize(mu, log_var))
        return x_reconst, mu, log_var

# Note: `model` and `optimizer` now refer to the VAE, replacing the objects
# created earlier in the notebook under the same names.
model = VAE().to(device)
optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)

# Start training
for epoch in range(num_epochs):
    for i, (x, _) in enumerate(data_loader):
        # Forward pass on flattened images
        x = x.to(device).view(-1, image_size)
        x_reconst, mu, log_var = model(x)

        # Compute reconstruction loss and kl divergence
        # For KL divergence, see Appendix B in VAE paper or http://yunjey47.tistory.com/43
        # reduction='sum' is the supported spelling of the deprecated size_average=False.
        reconst_loss = F.binary_cross_entropy(x_reconst, x, reduction='sum')
        kl_div = - 0.5 * torch.sum(1 + log_var - mu.pow(2) - log_var.exp())

        # Backprop and optimize
        loss = reconst_loss + kl_div
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        if (i+1) % 200 == 0:
            print ("Epoch[{}/{}], Step [{}/{}], Reconst Loss: {:.4f}, KL Div: {:.4f}, TOTAL : {:.4f}"
                   .format(epoch+1, num_epochs, i+1, len(data_loader), reconst_loss.item(), kl_div.item(), kl_div.item()+reconst_loss.item()))


In [None]:
# Shape of the first element of the first tuple stored in `l`.
l[0][0].shape

# Result for Defense on CW Attack using VAE

In [None]:
# Defense: pass each attacked batch through the VAE and classify the
# reconstruction; accuracy is measured against the true labels.
with torch.no_grad():

    correct = 0
    total = 0
    for attacked, trueimages, labels in l:

        # Feed the *attacked* images to the defense. Reshaping `trueimages`
        # here would score the pipeline on clean data instead.
        attacked = attacked.reshape(-1, 1, 28, 28).to(device)
        labels = labels.to(device)

        vae_input = attacked.view(-1, image_size)
        attacked_reconstructed, mu, log_var = model(vae_input)
        attacked_reconstructed = attacked_reconstructed.view(-1, 1, 28, 28)
        outputs = my_model(attacked_reconstructed)[0]

        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
        print('Accuracy of the network on the attacked images so far: {} %'.format(100 * correct / total))

    print('Final Accuracy of the network on the attacked images: {} %'.format(100 * correct / total))
    

# Result for Defense against Targeted FGSM Attack using VAE

In [None]:
# Defense: pass each targeted-FGSM batch through the VAE and classify the
# reconstruction; accuracy is measured against the true labels.
with torch.no_grad():

    correct = 0
    total = 0
    for attacked, trueimages, labels in l_tfgsm:

        # Feed the *attacked* images to the defense. Reshaping `trueimages`
        # here would score the pipeline on clean data instead.
        attacked = attacked.reshape(-1, 1, 28, 28).to(device)
        labels = labels.to(device)

        vae_input = attacked.view(-1, image_size)
        attacked_reconstructed, mu, log_var = model(vae_input)
        attacked_reconstructed = attacked_reconstructed.view(-1, 1, 28, 28)
        outputs = my_model(attacked_reconstructed)[0]

        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
        print('Accuracy of the network on the attacked images so far: {} %'.format(100 * correct / total))

    print('Final Accuracy of the network on the attacked images: {} %'.format(100 * correct / total))
    

# Defense VAE using KNN methodology

In [None]:
# l contains values for the CW attack
# l_tgsm contains the value for the tfgsm attack

from sklearn.neighbors import NearestNeighbors

N=1000 #generating N random images from Z space

with torch.no_grad():
    # Decode N random latent vectors into candidate images.
    z = torch.randn(N, z_dim).to(device)
    output = model.decode(z)  #generation of N images
    print(output.shape)
    out = output.view(-1, image_size)

# Index the generated images for 1-nearest-neighbour lookup.
samples = out.cpu().numpy()
neigh = NearestNeighbors(n_neighbors=1)
neigh.fit(samples)

correct = 0
total = 0

with torch.no_grad():
    for attacked, trueimages, labels in l:
        # Replace every attacked image by its closest generated image.
        temp = attacked.view(-1, image_size).detach()
        numpy_attacked = temp.cpu().numpy()
        result = neigh.kneighbors(numpy_attacked)
        # result[1] is a numpy array containing the index of the closest image in the sample space
        index = list(result[1].flatten())
        ClosestImage = output[index, :]
        input_to_classifier = ClosestImage.view(-1, 1, 28, 28)
        print(input_to_classifier.shape)
        # Keep the classifier scores in `outputs`: assigning them to `output`
        # would overwrite the generated images needed by the next batch, and
        # the prediction below must read this batch's scores.
        outputs = my_model(input_to_classifier)[0]
        labels = labels.to(device)
        _, predicted = torch.max(outputs.data, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()
        print('Accuracy of the network on the attacked images so far: {} %'.format(100 * correct / total))

print('Final Accuracy of the network on the attacked images: {} %'.format(100 * correct / total))

In [None]:
# Show which device (cuda or cpu) was selected.
print(device)

# VAE Testing

In [None]:
with torch.no_grad():
    # Decode one batch of random latent vectors into 1x28x28 images (nothing is written to disk).
    z = torch.randn(batch_size, z_dim).to(device)
    out = model.decode(z).view(-1, 1, 28, 28)

In [None]:
with torch.no_grad():
    # Decode one batch of random latent vectors into 1x28x28 images (nothing is written to disk).
    z = torch.randn(batch_size, z_dim).to(device)
    out = model.decode(z).view(-1, 1, 28, 28)
    
print(out.shape)
# Drop the channel axis and move to numpy for plotting.
out = out.reshape(-1, 28,28).cpu().numpy()
print(out.shape)
import matplotlib.pyplot as plt
from pylab import * 
# Grid of 2 rows by `rangee` columns.
# NOTE(review): k only takes the values 1 .. rangee-1, so the last column of each
# row is never drawn and out[0] is skipped -- confirm whether that is intended.
rangee = 3
for k in range(1, rangee):
    subplot(2, rangee, k)
    plt.axis('off')
    imshow(out[k], cmap='Greys')
    subplot(2, rangee, k+rangee)
    imshow(out[k+rangee], cmap='Greys')
    plt.axis('off')   

In [None]:
# Continue training the VAE with the KL term down-weighted to 0.8.
for epoch in range(num_epochs):
    for i, (x, _) in enumerate(data_loader):
        # Forward pass on flattened images
        x = x.to(device).view(-1, image_size)
        x_reconst, mu, log_var = model(x)

        # Compute reconstruction loss and kl divergence
        # For KL divergence, see Appendix B in VAE paper or http://yunjey47.tistory.com/43
        # reduction='sum' is the supported spelling of the deprecated size_average=False.
        reconst_loss = F.binary_cross_entropy(x_reconst, x, reduction='sum')
        kl_div = - 0.5 * torch.sum(1 + log_var - mu.pow(2) - log_var.exp())

        # Backprop and optimize
        loss = reconst_loss + 0.8*kl_div
        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        if (i+1) % 200 == 0:
            # TOTAL is the unweighted sum of both terms, not the 0.8-weighted loss that is optimised.
            print ("Epoch[{}/{}], Step [{}/{}], Reconst Loss: {:.4f}, KL Div: {:.4f}, TOTAL : {:.4f}"
                   .format(epoch+1, num_epochs, i+1, len(data_loader), reconst_loss.item(), kl_div.item(), kl_div.item()+reconst_loss.item()))


# The following cells are scratch snippet tests; they are not part of the analysis


In [None]:
# Take the images of the first stored batch and convert them to numpy.
# NOTE(review): this unpacking needs 2-element entries in `l`; some cells store 3-tuples -- verify which `l` is live.
im,_=l[0]
im=im.data.cpu().numpy()

In [None]:
# Take the images of the first entry of `actual` and convert them to numpy.
# NOTE(review): every visible append to `actual` is commented out, so the list looks empty here -- verify.
old_im,_=actual[0]
old_im=old_im.data.cpu().numpy()

In [None]:
# Drop the channel axis; 100 matches the batch size of test_loader.
im=im.reshape(100,28,28)
old_im=old_im.reshape(100,28,28)

In [None]:
import matplotlib.pyplot as plt

In [None]:
# Show the third image of the `old_im` batch.
plt.imshow(old_im[2])

In [None]:
# Show the third image of the `im` batch.
plt.imshow(im[2])

In [None]:
#these ae just snippet tests they don't mean anything now
subplot(1,2,1)
title('adversarial example')
imshow(im[2],cmap='gray')
subplot(1,2,2)
title('actual sample')
imshow(old_im[2],cmap='gray')

In [None]:
# Classify the second image of `im` and of `old_im` and print the predicted class.
image1 = torch.from_numpy(im[1])
img_t1 = image1.reshape(-1, 1, 28, 28).to(device)
# my_model returns (class scores, hidden features); take the scores.
outputs = my_model(img_t1)[0]
_, predicted = torch.max(outputs.data, 1)
print(predicted)

image2 = torch.from_numpy(old_im[1])
img_t2 = image2.reshape(-1, 1, 28, 28).to(device)
outputs = my_model(img_t2)[0]
_, predicted = torch.max(outputs.data, 1)
print(predicted)

**Training a GAN**




In [None]:
# Layer sizes for the generator (g_*) and the discriminator (d_*).
g_input_size=10
g_hidden_size=5
# NOTE(review): no value is assigned here, so this cell does not parse -- fill in the generator output width.
g_output_size=

# NOTE(review): value missing here as well -- presumably it should match g_output_size; confirm.
d_input_size=
d_hidden_size=10
d_output_size=1
minibatch_size=d_input_size 

# Activation functions handed to the Generator and Discriminator constructors.
generator_activation_function=torch.tanh
discriminator_activation_function=torch.sigmoid

In [None]:
def get_generator_input_sampler():
    """Return a function that draws standard-normal noise for the generator."""
    def sample(n):
        # The noise has shape (g_input_size, 1).
        # NOTE(review): `n` is accepted but never used -- confirm whether the
        # sample count was meant to set one of the dimensions.
        return torch.Tensor(np.random.normal(0, 1, (g_input_size, 1)))
    return sample

In [None]:
class Generator(nn.Module):
    """Three-layer perceptron; activation ``f`` follows the first two layers only."""

    def __init__(self, input_size, hidden_size, output_size, f):
        super().__init__()
        self.map1 = nn.Linear(input_size, hidden_size)
        self.map2 = nn.Linear(hidden_size, hidden_size)
        self.map3 = nn.Linear(hidden_size, output_size)
        self.f = f

    def forward(self, x):
        """Return map3(f(map2(f(map1(x))))) -- the last layer stays linear."""
        hidden = self.f(self.map1(x))
        hidden = self.f(self.map2(hidden))
        return self.map3(hidden)

In [None]:
class Discriminator(nn.Module):
    """
    Three-layer perceptron with activation ``f`` applied after every layer.

    Declared with ``class`` (the former ``def Discriminator(nn.Module):`` was a
    syntax error), so it can be instantiated like the Generator.
    """
    def __init__(self, input_size, hidden_size, output_size, f):
        super(Discriminator, self).__init__()
        self.map1 = nn.Linear(input_size, hidden_size)
        self.map2 = nn.Linear(hidden_size, hidden_size)
        self.map3 = nn.Linear(hidden_size, output_size)
        self.f = f

    def forward(self, x):
        """Return f(map3(f(map2(f(map1(x))))))."""
        x = self.f(self.map1(x))
        x = self.f(self.map2(x))
        x = self.f(self.map3(x))
        return x

In [None]:
# Instantiate both networks from the size and activation settings defined above.
G = Generator(
    input_size=g_input_size,
    hidden_size=g_hidden_size,
    output_size=g_output_size,
    f=generator_activation_function,
)

D = Discriminator(
    input_size=d_input_size,
    hidden_size=d_hidden_size,
    output_size=d_output_size,
    f=discriminator_activation_function,
)


In [None]:
# Skeleton of the GAN training loop; the discriminator update is not implemented yet.
Number_epochs=50
D_steps=5

for epoch in range(Number_epochs):
    for d_index in range(D_steps):
        #train D on real+fake
        # NOTE(review): the bare name below is a placeholder expression with no effect.
        D
        