In [None]:
import argparse
import datetime
import os
from importlib import reload

import matplotlib.pyplot as plt
import numpy as np
import pandas as pd
import torch
import torch.nn as nn
import torch.nn.functional as F
import torch.optim as optim

import utils.models as models
import utils.plotting as plotting
import utils.dataloaders as dl
import utils.traintest as tt
import utils.adversarial as adv
import utils.eval as ev
import utils.gmm_helpers as gmm_helpers
import utils.mc_dropout as mc
import model_params as params

# Pick up any edits made to utils/mc_dropout.py since it was first imported.
reload(mc)

# Seed the RNGs so that weight initialisation and shuffling are repeatable
# across "Restart Kernel -> Run All" (full determinism on GPU is not guaranteed).
SEED = 0
torch.manual_seed(SEED)
np.random.seed(SEED)

# Key into params.params_dict; also selects the architecture further below.
dataset = 'MNIST'

saving_string = dataset + '_base'

# Prefer the second GPU (the original hard-coded choice), but fall back to the
# first GPU or the CPU so the notebook still runs on smaller machines.
if torch.cuda.device_count() > 1:
    device = torch.device('cuda:1')
elif torch.cuda.is_available():
    device = torch.device('cuda:0')
else:
    device = torch.device('cpu')

# Dataset-specific parameter object; later cells read .lr, .train_loader,
# .test_loader and .classes from it.
model_params = params.params_dict[dataset](augm_flag=True)

def train(model, device, train_loader, optimizer, epoch, 
          verbose=100, noise_loader=None, epsilon=.3):
    """Train ``model`` for one epoch with the negative log-likelihood loss.

    ``nn.NLLLoss`` is applied directly to the model output, so the model is
    expected to return log-probabilities.

    Args:
        model: network to optimise; switched to training mode here.
        device: device that each batch is moved to before the forward pass.
        train_loader: iterable of ``(data, target)`` batches that also exposes
            ``.dataset`` (used only for the progress message).
        optimizer: optimiser stepping the parameters of ``model``.
        epoch: epoch index, used only in the progress message.
        verbose: print progress every ``verbose`` batches; any value ``<= 0``
            disables printing.
        noise_loader: unused; kept for signature compatibility.
        epsilon: unused; kept for signature compatibility.

    Returns:
        Tuple ``(mean_loss, accuracy)``, both averaged over the samples that
        were actually processed in this epoch. ``(0.0, 0.0)`` is returned when
        the loader yields no batches.
    """
    criterion = nn.NLLLoss()
    model.train()

    loss_sum = 0.0
    correct = 0
    seen = 0

    for batch_idx, (data, target) in enumerate(train_loader):
        data, target = data.to(device), target.to(device)

        output = model(data)
        loss = criterion(output, target)

        optimizer.zero_grad()
        loss.backward()
        optimizer.step()

        # criterion returns the batch mean; weight it by the batch size so the
        # epoch value is a true per-sample mean even with a short last batch.
        batch_size = target.size(0)
        loss_sum += loss.item() * batch_size
        seen += batch_size

        _, predicted = output.max(1)
        correct += predicted.eq(target).sum().item()

        # Test verbose > 0 first: `batch_idx % 0` would raise ZeroDivisionError.
        if verbose > 0 and batch_idx % verbose == 0:
            print('Train Epoch: {} [{}/{} ({:.0f}%)]\tLoss: {:.6f}'.format(
                epoch, batch_idx * len(data), len(train_loader.dataset),
                100. * batch_idx / len(train_loader), loss.item()))

    if seen == 0:
        return 0.0, 0.0
    return loss_sum / seen, correct / seen


# Build the MC-dropout network that matches the selected dataset.
if dataset=='MNIST':
    model = mc.LeNet()
elif dataset=='FMNIST':
    model = mc.vgg13(in_channels=1, num_classes=10)
elif dataset in ['SVHN', 'CIFAR10']:
    model = mc.vgg13(in_channels=3, num_classes=10)
elif dataset=='CIFAR100':
    model = mc.vgg13(in_channels=3, num_classes=100)
else:
    # Fail here with a clear message instead of a NameError on `model` below.
    raise ValueError('Unsupported dataset: {!r}'.format(dataset))


model = model.to(device)


# Single parameter group: dataset-specific learning rate plus L2 weight decay.
param_groups = [{'params':model.parameters(),'lr':model_params.lr, 'weight_decay':5e-4}]

# Adam for MNIST, SGD with momentum for every other dataset.
if dataset=='MNIST':
    optimizer = optim.Adam(param_groups)
else: 
    optimizer = optim.SGD(param_groups, momentum=0.9)


# 100 epochs with a step schedule: the learning rate is divided by 10 right
# before the 50th, 75th and 90th epoch (1-based) are trained.
for epoch in range(100):
    if epoch+1 in [50,75,90]:
        for group in optimizer.param_groups:
            group['lr'] *= .1
 
    # verbose=-1 silences the per-batch progress output of train().
    trainloss, correct_train = train(model, device, model_params.train_loader,  
                                     optimizer, epoch, verbose=-1)
    # One line per epoch: epoch index and training accuracy.
    print(str(epoch) + ': \t' + str(correct_train))

# Move the trained network back to the CPU for the cells that follow.
model = model.to('cpu')

In [39]:
# Re-import utils.mc_dropout so edits to the module are picked up.
# NOTE(review): `model` was built before this reload, so it is still an
# instance of the pre-reload class definitions - confirm that is intended.
reload(mc)
# Wrap the trained network; `iterations` is presumably the number of
# stochastic forward passes per input - TODO confirm in utils.mc_dropout.
mc_model = mc.MC_Model(model, iterations=7, classes=model_params.classes)
# Last expression of the cell, so its return value (the module repr below) is
# displayed; presumably nn.Module.cpu(), which moves the module to the CPU.
mc_model.cpu()

MC_Model(
  (model): LeNet(
    (conv1): Conv2d(1, 32, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (conv2): Conv2d(32, 64, kernel_size=(5, 5), stride=(1, 1), padding=(2, 2))
    (fc1): Linear(in_features=3136, out_features=1024, bias=True)
    (fc2): Linear(in_features=1024, out_features=10, bias=True)
    (dropout): MC_dropout(p=0.5)
  )
)

In [8]:
# Create the target directory first; torch.save does not create missing
# parent directories and would otherwise fail with FileNotFoundError.
save_dir = 'SavedModels/other/mcdo/'
os.makedirs(save_dir, exist_ok=True)
# NOTE: this pickles the whole wrapper object (not just a state_dict), so
# loading it later requires the same utils.mc_dropout classes to be importable.
torch.save(mc_model, save_dir + dataset + '.pth')

tensor(0.4970)

In [32]:
# Synthetic probe batch: 10 single-channel 28x28 inputs filled with ones.
x = torch.ones(10, 1, 28, 28)

In [35]:
# Evaluate the MC-dropout wrapper on the all-ones batch and display the result.
# NOTE(review): the displayed output is -inf for all but one class per row;
# verify how MC_Model aggregates its passes before using these as log-probs.
mc_model(x)

tensor([[   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -0.8305,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -0.8897,    -inf],
        [-0.8881,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -0.8656,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -0.8931,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -0.8683,    -inf],
        [-0.9066,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [-0.8565,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [-0.8324,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [   -inf,  

In [37]:
# Take the first element of the first test batch (presumably the inputs,
# with labels at index 1 - TODO confirm against the loader).
data = next(iter(model_params.test_loader))[0]

In [40]:
# Evaluate the MC-dropout wrapper on the test batch and display the result.
# NOTE(review): as with the all-ones probe, every row shows a single finite
# entry and -inf elsewhere - confirm this is the intended output format.
mc_model(data)

tensor([[    -inf,     -inf,     -inf,     -inf,     -inf,     -inf,     -inf,
          -9.3331,     -inf,     -inf],
        [    -inf,     -inf, -10.6661,     -inf,     -inf,     -inf,     -inf,
             -inf,     -inf,     -inf],
        [    -inf, -10.6220,     -inf,     -inf,     -inf,     -inf,     -inf,
             -inf,     -inf,     -inf],
        [-10.3072,     -inf,     -inf,     -inf,     -inf,     -inf,     -inf,
             -inf,     -inf,     -inf],
        [    -inf,     -inf,     -inf,     -inf, -12.7620,     -inf,     -inf,
             -inf,     -inf,     -inf],
        [    -inf,  -8.3448,     -inf,     -inf,     -inf,     -inf,     -inf,
             -inf,     -inf,     -inf],
        [    -inf,     -inf,     -inf,     -inf, -10.4289,     -inf,     -inf,
             -inf,     -inf,     -inf],
        [    -inf,     -inf,     -inf,     -inf,     -inf,     -inf,     -inf,
             -inf,     -inf,  -7.6124],
        [    -inf,     -inf,     -inf,     -inf,

In [41]:
# Second evaluation on the all-ones batch. The displayed values differ from
# the earlier run on the same input; presumably because dropout stays active
# at inference and/or mc_model was rebuilt in between - TODO confirm.
mc_model(x)

tensor([[-3.0968,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [-3.7206,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -2.9970,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -3.6776,    -inf],
        [-2.9564,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [-3.1235,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -3.3417,    -inf],
        [-3.0288,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
            -inf,    -inf],
        [   -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,    -inf,
         -3.3627,    -inf],
        [   -inf,  