In [1]:
%matplotlib notebook
import cvxpy as cp
import dccp
import torch
import numpy as np
from cvxpylayers.torch import CvxpyLayer
import matplotlib.pyplot as plt
from mpl_toolkits.mplot3d import Axes3D
from sklearn import svm
from sklearn.metrics import zero_one_loss, confusion_matrix
from scipy.io import arff
import pandas as pd
import time
import torch.optim as optim
from torch.utils.data import TensorDataset, DataLoader
from sklearn.datasets import make_classification
from sklearn.utils import shuffle
import matplotlib.patches as mpatches
import json
import random
import math
import os, psutil
from datetime import datetime

torch.set_default_dtype(torch.float64)
torch.manual_seed(0)
np.random.seed(0)

XDIM = 2
TRAIN_SLOPE = 1
EVAL_SLOPE = 5
COST = 1./XDIM
EPSILON = 0.005
X_LOWER_BOUND = -10
X_UPPER_BOUND = 10

In [2]:
def visualize_data2D(X, Y):
    if not XDIM == 2:
        return
    
    Xpos = X[Y == 1]
    Xneg = X[Y == -1]
    fig = plt.figure()
    ax = fig.add_subplot(111)
    ax.scatter(Xpos[:, 0], Xpos[:, 1], marker='+', color='green')
    ax.scatter(Xneg[:, 0], Xneg[:, 1], marker='_', color='purple')
    plt.show()
    
def visualize_weights(w1, b1, w2, b2):
    fig = plt.figure()
    plt.bar(np.arange(XDIM + 1), np.append(w1, b1), color='b', alpha=0.5)
    plt.bar(np.arange(XDIM + 1), np.append(w2, b2), color='r', alpha=0.5)
    plt.show()
    
def visualize_data3D(X, Y):
    if not XDIM == 3:
        return
    
    Xpos = X[Y == 1][:100]
    Xneg = X[Y == -1][:100]
    fig = plt.figure()
    ax = fig.add_subplot(111, projection='3d')
    ax.scatter(Xpos[:, 0], Xpos[:, 1], Xpos[:, 2], marker='+', color='green')
    ax.scatter(Xneg[:, 0], Xneg[:, 1], Xneg[:, 2], marker='_', color='purple')
    plt.show()
    
def visualize_data2D(X, Y):
    if not XDIM == 2:
        return
    
    Xpos = X[Y == 1]
    Xneg = X[Y == -1]
    fig = plt.figure()
    ax = fig.add_subplot(111)
    ax.scatter(Xpos[:, 0], Xpos[:, 1], marker='+', color='green')
    ax.scatter(Xneg[:, 0], Xneg[:, 1], marker='_', color='purple')
    plt.show()
    
def visualize_data(X, Y):
    if XDIM == 2:
        visualize_data2D(X, Y)
    else:
        visualize_data3D(X, Y)
    
def visualize_strategic_data3D(Xval, Xval_opt, Yval, w_non_strategic, b_non_strategic, w_strategic, b_strategic):
    if not XDIM == 3:
        return

    Xpos = Xval[Yval == 1][:50]
    Xneg = Xval[Yval == -1][:50]
    XposOpt = Xval_opt[Yval == 1][:50]
    XnegOpt = Xval_opt[Yval == -1][:50]

    fig = plt.figure()
    ax = fig.add_subplot(111, projection='3d')

    ax.scatter(Xpos[:, 0], Xpos[:, 1], Xpos[:, 2], marker='+', color='blue')
    ax.scatter(Xneg[:, 0], Xneg[:, 1], Xneg[:, 2], marker='_', color='blue')

    ax.scatter(XposOpt[:, 0], XposOpt[:, 1], XposOpt[:, 2], marker='+', color='red')
    ax.scatter(XnegOpt[:, 0], XnegOpt[:, 1], XnegOpt[:, 2], marker='_', color='red')

    range_arr = torch.arange(-2, 2 + 1)
    xx, yy = torch.meshgrid(range_arr, range_arr)
    z = (-w_non_strategic[0] * xx - w_non_strategic[1] * yy - b_non_strategic) * 1. /w_non_strategic[2]
    ax.plot_surface(xx.numpy(), yy.numpy(), z.numpy(), alpha=0.2, color='blue')

    xx, yy = torch.meshgrid(range_arr, range_arr)
    z = (-w_strategic[0] * xx - w_strategic[1] * yy - b_strategic) * 1. /w_strategic[2]
    ax.plot_surface(xx.numpy(), yy.numpy(), z.numpy(), alpha=0.2, color='red')
#     ax.set_xlim3d(-1.2, 1.2)
#     ax.set_ylim3d(-1.2, 1.2)
#     ax.set_zlim3d(-1.2, 1.2)
#     ax.view_init(25, 45)
#     plt.savefig('plots/simple_strategic_classification.pdf', format='pdf')
#     plt.savefig('plots/simple_strategic_classification.eps', format='eps')
#     plt.savefig('plots/simple_strategic_classification.png', format='png')
    plt.show()

def visualize_strategic_data2D(Xval, Xval_opt, Yval, w_non_strategic, b_non_strategic, w_strategic, b_strategic):
    if not XDIM == 2:
        return

    Xpos = Xval[Yval == 1][:50]
    Xneg = Xval[Yval == -1][:50]
    XposOpt = Xval_opt[Yval == 1][:50]
    XnegOpt = Xval_opt[Yval == -1][:50]

    fig = plt.figure()
    ax = fig.add_subplot(111)

    ax.scatter(Xpos[:, 0], Xpos[:, 1], marker='+', color='blue')
    ax.scatter(Xneg[:, 0], Xneg[:, 1], marker='_', color='blue')

    ax.scatter(XposOpt[:, 0], XposOpt[:, 1], marker='+', color='red')
    ax.scatter(XnegOpt[:, 0], XnegOpt[:, 1], marker='_', color='red')

    range_arr = torch.arange(-0.5, 2 + 1)
    xx = torch.meshgrid(range_arr)[0]
    z = (-w_non_strategic[0] * xx - b_non_strategic) * 1. /w_non_strategic[1]
    ax.plot(xx.detach().numpy(), z.detach().numpy(), alpha=0.2, color='blue')

    xx = torch.meshgrid(range_arr)[0]
    z = (-w_strategic[0] * xx - b_strategic) * 1. /w_strategic[1]
    ax.plot(xx.detach().numpy(), z.detach().numpy(), alpha=0.2, color='red')

    plt.show()
    
def visualize_strategic_data(Xval, Xval_opt, Yval, w_non_strategic, b_non_strategic, w_strategic, b_strategic):
    if XDIM == 2:
        visualize_strategic_data2D(Xval, Xval_opt, Yval, w_non_strategic, b_non_strategic, w_strategic, b_strategic)
    else:
        visualize_strategic_data3D(Xval, Xval_opt, Yval, w_non_strategic, b_non_strategic, w_strategic, b_strategic)
        
def visualize_training_errors(train_errors, val_errors):
    fig = plt.figure()
    train_patch, = plt.plot(torch.arange(len(train_errors)), np.mean(train_errors, axis=1), color='blue', label="train")
    val_patch, = plt.plot(torch.arange(len(val_errors)), val_errors, color='orange', label="validation")
    plt.legend(handles=[train_patch, val_patch])

    plt.show()
    
def visualize_training_losses(train_losses, val_losses):
    fig = plt.figure()
    train_patch, = plt.plot(torch.arange(len(train_losses)), np.mean(train_losses, axis=1), color='blue', label="train")
    val_patch, = plt.plot(torch.arange(len(val_losses)), val_losses, color='orange', label="validation")
    plt.legend(handles=[train_patch, val_patch])
    
    plt.show()

# Utils

In [3]:
def split_data(X, Y, percentage):
    num_val = int(len(X)*percentage)
    return X[num_val:], Y[num_val:], X[:num_val], Y[:num_val]

def shuffle(X, Y):
    data = torch.cat((X, Y), 1)
    data = data[torch.randperm(data.size()[0])]
    X = data[:, :2]
    Y = data[:, 2]
    return X, Y

def conf_mat(Y1, Y2):
    num_of_samples = len(Y1)
    mat = confusion_matrix(Y1, Y2, labels=[-1, 1])*100/num_of_samples
    acc = np.trace(mat)
    return mat, acc

def calc_accuracy(Y, Ypred):
    num = len(Y)
    temp = Y - Ypred
    acc = len(temp[temp == 0])*1./num
    return acc

# Dataset

In [4]:
def load_spam_dataset():
    torch.manual_seed(0)
    np.random.seed(0)

    path = r"C:\Users\sagil\Desktop\nir project\tip_spam_data\IS_journal_tip_spam.arff"
    data, meta = arff.loadarff(path)
    df = pd.DataFrame(data)
    most_disc = ['qTips_plc', 'rating_plc', 'qEmail_tip', 'qContacts_tip', 'qURL_tip', 'qPhone_tip', 'qNumeriChar_tip', 'sentistrength_tip', 'combined_tip', 'qWords_tip', 'followers_followees_gph', 'qunigram_avg_tip', 'qTips_usr', 'indeg_gph', 'qCapitalChar_tip', 'class1']
    df = df[most_disc]
    df["class1"].replace({b'spam': -1, b'notspam': 1}, inplace=True)
    df = df.sample(frac=1).reset_index(drop=True)

    Y = df['class1'].values
    X = df.drop('class1', axis = 1).values
    X -= np.mean(X, axis=0)
    X /= np.std(X, axis=0)
    return torch.from_numpy(X), torch.from_numpy(Y)

def gen_custom_data(N, pos_ranges, neg_ranges):
    """
    pos_ranges: a tuple of tensors of length XDIM.
    (scales tensor, offsets tensor)
    """
    torch.manual_seed(0)
    np.random.seed(0)
    pos_samples_num = N//2
    neg_samples_num = N - pos_samples_num
    posX = torch.rand((pos_samples_num, XDIM))*pos_ranges[0] + pos_ranges[1]
    negX = torch.rand((neg_samples_num, XDIM))*neg_ranges[0] + neg_ranges[1]
    
    X = torch.cat((posX, negX), 0)
    Y = torch.unsqueeze(torch.cat((torch.ones(len(posX)), -torch.ones(len(negX))), 0), 1)

    X, Y = shuffle(X, Y)
    return X, Y

# CCP classes

In [5]:
class CCP:
    def __init__(self, x_dim, funcs):
        self.f_derivative = funcs["f_derivative"]
        self.g = funcs["g"]
        self.c = funcs["c"]
        
        self.x = cp.Variable(x_dim)
        self.xt = cp.Parameter(x_dim)
        self.r = cp.Parameter(x_dim)
        self.w = cp.Parameter(x_dim)
        self.b = cp.Parameter(1)
        self.slope = cp.Parameter(1)
        self.v = cp.Parameter(x_dim)

        target = self.x@self.f_derivative(self.xt, self.w, self.b, self.slope)-self.g(self.x, self.w, self.b, self.slope)-self.c(self.x, self.r, self.v)
        constraints = [self.x >= X_LOWER_BOUND,
                       self.x <= X_UPPER_BOUND]
        self.prob = cp.Problem(cp.Maximize(target), constraints)
        
    def ccp(self, r):
        """
        numpy to numpy
        """
        self.xt.value = r
        self.r.value = r
        result = self.prob.solve()
        diff = np.linalg.norm(self.xt.value - self.x.value)
        cnt = 0
        while diff > 0.0001 and cnt < 10:
            cnt += 1
            self.xt.value = self.x.value
            result = self.prob.solve()
            diff = np.linalg.norm(self.x.value - self.xt.value)
        return self.x.value
    
    def optimize_X(self, X, w, b, slope, v):
        """
        tensor to tensor
        """
        w = w.detach().numpy()
        b = b.detach().numpy()
        v = v.detach().numpy()
        slope = np.full(1, slope)
        X = X.numpy()
        
        self.w.value = w
        self.b.value = b
        self.slope.value = slope
        self.v.value = v
        
        return torch.stack([torch.from_numpy(self.ccp(x)) for x in X])

In [6]:
class DELTA():
    
    def __init__(self, x_dim, funcs):
        self.g = funcs["g"]
        self.c = funcs["c_dpp_form"]
        
        self.x = cp.Variable(x_dim)
        self.r = cp.Parameter(x_dim, value = np.random.randn(x_dim))
        self.w = cp.Parameter(x_dim, value = np.random.randn(x_dim))
        self.b = cp.Parameter(1, value = np.random.randn(1))
        self.v = cp.Parameter(XDIM, value = np.random.randn(XDIM))
        self.rv = cp.Parameter(1, value = np.random.randn(1)) # r times v
        self.f_der = cp.Parameter(x_dim, value = np.random.randn(x_dim))

        target = self.x@self.f_der-self.g(self.x, self.w, self.b, TRAIN_SLOPE)-self.c(self.x, self.r, self.v, self.rv)
        constraints = [self.x >= X_LOWER_BOUND,
                       self.x <= X_UPPER_BOUND]
        objective = cp.Maximize(target)
        problem = cp.Problem(objective, constraints)
        self.layer = CvxpyLayer(problem, parameters=[self.r, self.w, self.b, self.v, self.rv, self.f_der],
                                variables=[self.x])
        
    def optimize_X(self, X, w, b, v, F_DER):
        Rv = X@v
        Rv = torch.reshape(Rv, (Rv.size()[0], 1))
        return self.layer(X, w, b, v, Rv, F_DER)[0]

# Gain & Cost functions

In [7]:
def score(x, w, b):
    return x@w + b

def f(x, w, b, slope):
    return 0.5*cp.norm(cp.hstack([1, (slope*score(x, w, b) + 1)]), 2)

def g(x, w, b, slope):
    return 0.5*cp.norm(cp.hstack([1, (slope*score(x, w, b) - 1)]), 2)

def c(x, r, v):
    return COST*(EPSILON*cp.sum_squares(x-r) + (1-EPSILON)*cp.pos((x-r)@v)) # (1-EPSILON)*cp.sum(cp.pos(cp.multiply((x-r), v))))

def c_dpp_form(x, r, v, rv):
    return COST*(EPSILON*cp.sum_squares(x-r) + (1-EPSILON)*cp.pos(x@v-rv)) # (1-EPSILON)*cp.sum(cp.pos(cp.multiply(x, v)-rv)))

def f_derivative(x, w, b, slope):
    return 0.5*cp.multiply(slope*((slope*score(x, w, b) + 1)/cp.sqrt((slope*score(x, w, b) + 1)**2 + 1)), w)

funcs = {"f": f, "g": g, "f_derivative": f_derivative, "c": c, "c_dpp_form": c_dpp_form, "score": score}

# Data generation

In [8]:
N = 500
X, Y = gen_custom_data(N, (torch.Tensor([1, 4]), torch.Tensor([0, -2])), (torch.Tensor([1, 4]), torch.Tensor([-1, -2])))

assert(len(X[0]) == XDIM)
X, Y, Xval, Yval = split_data(X, Y, 0.5)
Xval, Yval, Xtest, Ytest = split_data(Xval, Yval, 0.5)

print("percent of positive samples: {}%".format(100 * len(Y[Y == 1]) / len(Y)))
visualize_data(X, Y)
visualize_data(Xval, Yval)
visualize_data(Xtest, Ytest)

percent of positive samples: 46.8%


<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

<IPython.core.display.Javascript object>

# Model

In [9]:
class MyStrategicModel(torch.nn.Module):
    def __init__(self, x_dim, funcs, train_slope, eval_slope, v_orig, strategic=False, flexible=False, lamb=0):
        torch.manual_seed(0)
        np.random.seed(0)
    
        super(MyStrategicModel, self).__init__()
        self.x_dim = x_dim
        self.train_slope, self.eval_slope = train_slope, eval_slope
        self.flexible = flexible
        self.strategic = strategic
        self.lamb = lamb
        
        self.w = torch.nn.parameter.Parameter(math.sqrt(1/x_dim)*(1-2*torch.rand(x_dim, dtype=torch.float64, requires_grad=True)))
        self.b = torch.nn.parameter.Parameter(torch.rand(1, dtype=torch.float64, requires_grad=True))
        self.v_orig = v_orig
        self.v = torch.clone(v_orig)
        if self.flexible:
            self.v = torch.nn.parameter.Parameter(torch.clone(v_orig), requires_grad=True)
        
        self.ccp = CCP(x_dim, funcs)
        self.delta = DELTA(x_dim, funcs)
        
    def forward(self, X, evaluation=False):
        slope = self.eval_slope if evaluation else self.train_slope
        
        if self.strategic:
            XT = self.ccp.optimize_X(X, self.w, self.b, slope, self.v)
            F_DER = self.get_f_ders(XT, slope)
            X_opt = self.delta.optimize_X(X, self.w, self.b, self.v, F_DER) # Xopt should equal to XT but we do it again for the gradients
            output = self.score(X_opt)
        else:
            output = self.score(X)        
        
        return output
    
    def optimize_X(self, X, evaluation=True):
        slope = self.eval_slope if evaluation else self.train_slope
        return self.ccp.optimize_X(X, self.w, self.b, slope, self.v)
    
    def score(self, x):
        return x@self.w + self.b
    
    def get_f_ders(self, XT, slope):
        return torch.stack([0.5*slope*((slope*self.score(xt) + 1)/torch.sqrt((slope*self.score(xt) + 1)**2 + 1))*self.w for xt in XT])

    def evaluate(self, X, Y):
        Y_pred = torch.sign(self.forward(X, evaluation=True))
        num = len(Y)
        temp = Y - Y_pred
        acc = len(temp[temp == 0])*1./num        
        return acc
    
    def loss(self, Y, Y_pred):
        if self.flexible:
            return torch.mean(torch.clamp(1 - Y_pred * Y, min=0)) + self.lamb*torch.abs(torch.norm(self.v)-torch.norm(self.v_orig)) # self.lamb*torch.abs(torch.sum(self.v) - torch.sum(self.v_orig))
        else:
            return torch.mean(torch.clamp(1 - Y_pred * Y, min=0))
    
    def save_model(self, X, Y, Xval, Yval, train_errors, val_errors, train_losses, val_losses, info, path, comment=None):
        if comment is not None:
            path += "_____" + comment
            
        filename = path + "/model.pt"
        if not os.path.exists(os.path.dirname(filename)):
            os.makedirs(os.path.dirname(filename))
        torch.save(self.state_dict(), filename)
        
        pd.DataFrame(X.numpy()).to_csv(path + '/X.csv')
        pd.DataFrame(Y.numpy()).to_csv(path + '/Y.csv')
        pd.DataFrame(Xval.numpy()).to_csv(path + '/Xval.csv')
        pd.DataFrame(Yval.numpy()).to_csv(path + '/Yval.csv')
        
        pd.DataFrame(np.array(train_errors)).to_csv(path + '/train_errors.csv')
        pd.DataFrame(np.array(val_errors)).to_csv(path + '/val_errors.csv')
        pd.DataFrame(np.array(train_losses)).to_csv(path + '/train_losses.csv')
        pd.DataFrame(np.array(val_losses)).to_csv(path + '/val_losses.csv')
        
        with open(path + "/info.txt", "w") as f:
            f.write(info)
    
    def load_model(self, filename):
        self.load_state_dict(torch.load(filename))
        self.eval()
    
    def fit(self, X, Y, Xval, Yval, opt, opt_kwargs={"lr":1e-3}, batch_size=128, epochs=100, verbose=False, callback=None, calc_train_errors=False, comment=None):
        train_dset = TensorDataset(X, Y)
        train_loader = DataLoader(train_dset, batch_size=batch_size, shuffle=True)
        opt = opt(self.parameters(), **opt_kwargs)

        train_losses = []
        val_losses = []
        train_errors = []
        val_errors = []
        
        best_val_error = 1
        consecutive_no_improvement = 0
        now = datetime.now()
        path = "C:/Users/sagil/Desktop/nir project/models/flexability/" + now.strftime("%d-%m-%Y_%H-%M-%S")

        total_time = time.time()
        for epoch in range(epochs):
            print(self.v)
            t1 = time.time()
            batch = 1
            train_losses.append([])
            train_errors.append([])
            for Xbatch, Ybatch in train_loader:
                try:
                    opt.zero_grad()
                    Ybatch_pred = self.forward(Xbatch)
                    l = self.loss(Ybatch_pred, Ybatch)
                    l.backward()
                    opt.step()
                    train_losses[-1].append(l.item())
                    if calc_train_errors:
                        with torch.no_grad():
                            e = self.evaluate(Xbatch, Ybatch)
                            train_errors[-1].append(1-e)
                    if verbose:
                        print("batch %03d / %03d | loss: %3.5f" %
                              (batch, len(train_loader), np.mean(train_losses[-1])))
                    batch += 1
                    if callback is not None:
                        callback()
                except:
                    print("failed")

            with torch.no_grad():
                try:
                    Yval_pred = self.forward(Xval)
                    val_loss = self.loss(Yval_pred, Yval).item()
                    val_losses.append(val_loss)
                    val_error = 1-self.evaluate(Xval, Yval)
                    val_errors.append(val_error)
                    if val_error < best_val_error:
                        consecutive_no_improvement = 0
                        best_val_error = val_error
                        if self.strategic:
                            info = "training time in seconds: {}\nepoch: {}\nbatch size: {}\ntrain slope: {}\neval slope: {}\nlearning rate: {}\nvalidation loss: {}\nvalidation error: {}\n".format(
                            time.time()-total_time, epoch, batch_size, self.train_slope, self.eval_slope, opt_kwargs["lr"], val_loss, val_error)
                            self.save_model(X, Y, Xval, Yval, train_errors, val_errors, train_losses, val_losses, info, path, comment)
                            print("model saved!")
                    else:
                        consecutive_no_improvement += 1
                        if consecutive_no_improvement >= 10:
                            break
                except:
                    print("failed")
                    
            t2 = time.time()
            if verbose:
                print("----- epoch %03d / %03d | time: %03d sec | loss: %3.5f | err: %3.5f" % (epoch + 1, epochs, t2-t1, val_losses[-1], val_errors[-1]))
        print("training time: {} seconds".format(time.time()-total_time)) 
        return train_errors, val_errors, train_losses, val_losses

# Train

In [10]:
EPOCHS = 15
BATCH_SIZE = 16
LAMBDA = 0.1

x_dim = XDIM
v_orig = torch.Tensor([0.6, 0.8])


# non-strategic classification
print("---------- training non-strategically----------")
non_strategic_model = MyStrategicModel(x_dim, funcs, TRAIN_SLOPE, EVAL_SLOPE, v_orig, strategic=False, flexible=False)

fit_res_non_strategic = non_strategic_model.fit(X, Y, Xval, Yval,
                                opt=torch.optim.Adam, opt_kwargs={"lr": 5*(1e-2)},
                                batch_size=BATCH_SIZE, epochs=EPOCHS, verbose=True, calc_train_errors=False)

# strategic classification, flexible
print("---------- training strategically----------")
strategic_model_flex = MyStrategicModel(x_dim, funcs, TRAIN_SLOPE, EVAL_SLOPE, v_orig, strategic=True, flexible=True, lamb=LAMBDA)

fit_res_strategic_flex = strategic_model_flex.fit(X, Y, Xval, Yval,
                                opt=torch.optim.Adam, opt_kwargs={"lr": 5*(1e-2)},
                                batch_size=BATCH_SIZE, epochs=EPOCHS, verbose=True, calc_train_errors=False,
                                comment="flexible")
print("------", strategic_model_flex.v)

# strategic classification, not flexible
print("---------- training strategically----------")
strategic_model_not_flex = MyStrategicModel(x_dim, funcs, TRAIN_SLOPE, EVAL_SLOPE, v_orig, strategic=True, flexible=False)

fit_res_strategic_not_flex = strategic_model_not_flex.fit(X, Y, Xval, Yval,
                                opt=torch.optim.Adam, opt_kwargs={"lr": 5*(1e-2)},
                                batch_size=BATCH_SIZE, epochs=EPOCHS, verbose=True, calc_train_errors=False,
                                comment="fixed")
print("------", strategic_model_not_flex.v)

---------- training non-strategically----------
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 1.58033
batch 002 / 016 | loss: 1.56733
batch 003 / 016 | loss: 1.49148
batch 004 / 016 | loss: 1.39701
batch 005 / 016 | loss: 1.33940
batch 006 / 016 | loss: 1.32806
batch 007 / 016 | loss: 1.31961
batch 008 / 016 | loss: 1.31627
batch 009 / 016 | loss: 1.29143
batch 010 / 016 | loss: 1.26842
batch 011 / 016 | loss: 1.25615
batch 012 / 016 | loss: 1.23117
batch 013 / 016 | loss: 1.21370
batch 014 / 016 | loss: 1.19529
batch 015 / 016 | loss: 1.17921
batch 016 / 016 | loss: 1.16688
----- epoch 001 / 015 | time: 000 sec | loss: 0.94783 | err: 0.45600
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 0.85308
batch 002 / 016 | loss: 0.77906
batch 003 / 016 | loss: 0.76852
batch 004 / 016 | loss: 0.77840
batch 005 / 016 | loss: 0.77371
batch 006 / 016 | loss: 0.78573
batch 007 / 016 | loss: 0.79217
batch 008 / 016 | loss: 0.77606
batch 009 / 016 | loss: 0.77154
batch 010 / 016 | loss: 0.79164
b

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.




batch 010 / 016 | loss: 0.18436
batch 011 / 016 | loss: 0.17608
batch 012 / 016 | loss: 0.16578
batch 013 / 016 | loss: 0.17294
batch 014 / 016 | loss: 0.18416
batch 015 / 016 | loss: 0.18161
batch 016 / 016 | loss: 0.17401
----- epoch 007 / 015 | time: 000 sec | loss: 0.20263 | err: 0.00800
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 0.15338
batch 002 / 016 | loss: 0.12608
batch 003 / 016 | loss: 0.11536
batch 004 / 016 | loss: 0.13544
batch 005 / 016 | loss: 0.15262
batch 006 / 016 | loss: 0.15367
batch 007 / 016 | loss: 0.14435
batch 008 / 016 | loss: 0.14052
batch 009 / 016 | loss: 0.14785
batch 010 / 016 | loss: 0.16270
batch 011 / 016 | loss: 0.15500
batch 012 / 016 | loss: 0.15095
batch 013 / 016 | loss: 0.16209
batch 014 / 016 | loss: 0.15951
batch 015 / 016 | loss: 0.16289
batch 016 / 016 | loss: 0.16078
----- epoch 008 / 015 | time: 000 sec | loss: 0.20000 | err: 0.03200
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 0.07765
batch 002 / 016 | loss: 0.09590
batch 003 /

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

	https://www.cvxpy.org/tutorial/advanced/index


batch 001 / 016 | loss: 2.54298
batch 002 / 016 | loss: 2.75454
batch 003 / 016 | loss: 2.60912
batch 004 / 016 | loss: 2.20526
batch 005 / 016 | loss: 2.09160
batch 006 / 016 | loss: 2.08020
batch 007 / 016 | loss: 2.14639
batch 008 / 016 | loss: 2.17858
batch 009 / 016 | loss: 2.10358
batch 010 / 016 | loss: 2.03448
batch 011 / 016 | loss: 1.97981
batch 012 / 016 | loss: 1.88358
batch 013 / 016 | loss: 1.80765
batch 014 / 016 | loss: 1.74952
batch 015 / 016 | loss: 1.69939
batch 016 / 016 | loss: 1.65088


  "Solution may be inaccurate. Try another solver, "


model saved!
----- epoch 001 / 015 | time: 073 sec | loss: 0.99678 | err: 0.12800
Parameter containing:
tensor([0.5863, 0.8000], requires_grad=True)
batch 001 / 016 | loss: 1.00402
batch 002 / 016 | loss: 0.96789
batch 003 / 016 | loss: 1.02363
batch 004 / 016 | loss: 1.04212
batch 005 / 016 | loss: 1.03669
batch 006 / 016 | loss: 1.05238
batch 007 / 016 | loss: 1.02629
batch 008 / 016 | loss: 1.05056
batch 009 / 016 | loss: 1.05251
batch 010 / 016 | loss: 1.02800
batch 011 / 016 | loss: 1.02050
batch 012 / 016 | loss: 1.01623
batch 013 / 016 | loss: 1.03681
batch 014 / 016 | loss: 1.01938
batch 015 / 016 | loss: 1.02089
batch 016 / 016 | loss: 0.99657
----- epoch 002 / 015 | time: 090 sec | loss: 0.98198 | err: 0.46400
Parameter containing:
tensor([0.8036, 0.6148], requires_grad=True)
batch 001 / 016 | loss: 1.33673
batch 002 / 016 | loss: 1.05775
batch 003 / 016 | loss: 0.96943
batch 004 / 016 | loss: 1.07705
batch 005 / 016 | loss: 1.09967
batch 006 / 016 | loss: 1.07276
batch 007 /

batch 008 / 016 | loss: 0.54794
batch 009 / 016 | loss: 0.54657
batch 010 / 016 | loss: 0.54169
batch 011 / 016 | loss: 0.54203
batch 012 / 016 | loss: 0.54341
batch 013 / 016 | loss: 0.54416
batch 014 / 016 | loss: 0.54354
batch 015 / 016 | loss: 0.55051
batch 016 / 016 | loss: 0.55131
----- epoch 014 / 015 | time: 071 sec | loss: 0.58246 | err: 0.14400
Parameter containing:
tensor([ 1.6036, -0.2678], requires_grad=True)
batch 001 / 016 | loss: 0.58023
batch 002 / 016 | loss: 0.56154
batch 003 / 016 | loss: 0.52424
batch 004 / 016 | loss: 0.55618
batch 005 / 016 | loss: 0.55523
batch 006 / 016 | loss: 0.54451
batch 007 / 016 | loss: 0.53825
batch 008 / 016 | loss: 0.53074
batch 009 / 016 | loss: 0.51539
batch 010 / 016 | loss: 0.52137
batch 011 / 016 | loss: 0.51767
batch 012 / 016 | loss: 0.51268
batch 013 / 016 | loss: 0.50832
batch 014 / 016 | loss: 0.51234
batch 015 / 016 | loss: 0.50134
batch 016 / 016 | loss: 0.49811
----- epoch 015 / 015 | time: 090 sec | loss: 0.55068 | err: 0

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

	https://www.cvxpy.org/tutorial/advanced/index

batch 001 / 016 | loss: 2.54298
batch 002 / 016 | loss: 2.75110
batch 003 / 016 | loss: 2.60627
batch 004 / 016 | loss: 2.20204
batch 005 / 016 | loss: 2.08783
batch 006 / 016 | loss: 2.07617
batch 007 / 016 | loss: 2.14249
batch 008 / 016 | loss: 2.17516
batch 009 / 016 | loss: 2.10039


  "Solution may be inaccurate. Try another solver, "


batch 010 / 016 | loss: 2.03149
batch 011 / 016 | loss: 1.97709
batch 012 / 016 | loss: 1.88108
batch 013 / 016 | loss: 1.80527
batch 014 / 016 | loss: 1.74725
batch 015 / 016 | loss: 1.69726
batch 016 / 016 | loss: 1.64888
model saved!
----- epoch 001 / 015 | time: 067 sec | loss: 0.99604 | err: 0.15200
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 1.00329
batch 002 / 016 | loss: 0.96777
batch 003 / 016 | loss: 1.02275
batch 004 / 016 | loss: 1.04040
batch 005 / 016 | loss: 1.03370
batch 006 / 016 | loss: 1.04819
batch 007 / 016 | loss: 1.02246
batch 008 / 016 | loss: 1.04810
batch 009 / 016 | loss: 1.05359
batch 010 / 016 | loss: 1.03386
batch 011 / 016 | loss: 1.02548
batch 012 / 016 | loss: 1.02544
batch 013 / 016 | loss: 1.02754
batch 014 / 016 | loss: 1.01853
batch 015 / 016 | loss: 1.01516
batch 016 / 016 | loss: 0.99049
----- epoch 002 / 015 | time: 085 sec | loss: 0.94165 | err: 0.46400
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 1.28872
batch 002 / 016 | loss: 1.04268



batch 004 / 016 | loss: 0.90377
batch 005 / 016 | loss: 0.93057
batch 006 / 016 | loss: 0.98517
batch 007 / 016 | loss: 0.96848
batch 008 / 016 | loss: 0.95150
batch 009 / 016 | loss: 0.95481
batch 010 / 016 | loss: 0.94775
batch 011 / 016 | loss: 0.94917
batch 012 / 016 | loss: 0.95376
batch 013 / 016 | loss: 0.97009
batch 014 / 016 | loss: 0.97395
batch 015 / 016 | loss: 0.99434
batch 016 / 016 | loss: 1.01826
----- epoch 004 / 015 | time: 098 sec | loss: 0.91336 | err: 0.28000
tensor([0.6000, 0.8000])
batch 001 / 016 | loss: 0.90929
batch 002 / 016 | loss: 0.92156
batch 003 / 016 | loss: 0.94237
batch 004 / 016 | loss: 0.94229
batch 005 / 016 | loss: 0.91119
batch 006 / 016 | loss: 0.88017
batch 007 / 016 | loss: 0.92810
batch 008 / 016 | loss: 0.90849
batch 009 / 016 | loss: 0.89576
batch 010 / 016 | loss: 0.91348
batch 011 / 016 | loss: 0.91012
batch 012 / 016 | loss: 0.88344
batch 013 / 016 | loss: 0.88764
batch 014 / 016 | loss: 0.88978
batch 015 / 016 | loss: 0.87698
batch 016 

# Test results

In [14]:
strategic_model_flex = MyStrategicModel(x_dim, funcs, TRAIN_SLOPE, EVAL_SLOPE, v_orig, strategic=True, flexible=True, lamb=LAMBDA)
strategic_model_flex.load_model(r"C:\Users\sagil\Desktop\nir project\models\flexability\20-01-2021_15-56-32_____flexible\model.pt")

strategic_model_not_flex = MyStrategicModel(x_dim, funcs, TRAIN_SLOPE, EVAL_SLOPE, v_orig, strategic=True, flexible=False)
strategic_model_not_flex.load_model(r"C:\Users\sagil\Desktop\nir project\models\flexability\20-01-2021_16-16-16_____fixed\model.pt")

Xval_opt = non_strategic_model.optimize_X(Xval, evaluation=True)
Xval_opt_flex = strategic_model_flex.optimize_X(Xval, evaluation=True)
Xval_opt_not_flex = strategic_model_not_flex.optimize_X(Xval, evaluation=True)

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multiplication.
Using ``*`` for matrix multiplication has been deprecated since CVXPY 1.1.
    Use ``*`` for matrix-scalar and vector-scalar multiplication.
    Use ``@`` for matrix-matrix and matrix-vector multiplication.
    Use ``multiply`` for elementwise multiplication.

This use of ``*`` has resulted in matrix multi

In [15]:
print("non strategic model + non strategic data: ", non_strategic_model.evaluate(Xval, Yval))
print("non strategic model + strategic data: ", non_strategic_model.evaluate(Xval_opt, Yval))
print("flexible strategic model + strategic data: ", strategic_model_flex.evaluate(Xval, Yval))
print("fixed strategic model + strategic data: ", strategic_model_not_flex.evaluate(Xval, Yval))

  and should_run_async(code)


non strategic model + non strategic data:  0.992
non strategic model + strategic data:  0.544
flexible strategic model + strategic data:  0.984
fixed strategic model + strategic data:  0.848


In [19]:
visualize_strategic_data(Xval, Xval_opt, Yval, non_strategic_model.w, non_strategic_model.b, non_strategic_model.v, torch.zeros(1))

  and should_run_async(code)


<IPython.core.display.Javascript object>

In [23]:
print(strategic_model_not_flex.w)
visualize_strategic_data(Xval, Xval_opt_not_flex, Yval, strategic_model_not_flex.w, strategic_model_not_flex.b, strategic_model_not_flex.v, torch.zeros(1))

Parameter containing:
tensor([0.0316, 0.0060], requires_grad=True)


  and should_run_async(code)


<IPython.core.display.Javascript object>

In [22]:
print(strategic_model_flex.v)
visualize_strategic_data(Xval, Xval_opt_flex, Yval, strategic_model_flex.w, strategic_model_flex.b, strategic_model_flex.v, torch.zeros(1))

Parameter containing:
tensor([ 1.4378, -0.2290], requires_grad=True)


  and should_run_async(code)


<IPython.core.display.Javascript object>