In [2]:
import sys
sys.path

['/Users/litos/opt/anaconda3/envs/tensorflow_cpu/lib/python36.zip',
 '/Users/litos/opt/anaconda3/envs/tensorflow_cpu/lib/python3.6',
 '/Users/litos/opt/anaconda3/envs/tensorflow_cpu/lib/python3.6/lib-dynload',
 '',
 '/Users/litos/opt/anaconda3/envs/tensorflow_cpu/lib/python3.6/site-packages',
 '/Users/litos/opt/anaconda3/envs/tensorflow_cpu/lib/python3.6/site-packages/IPython/extensions',
 '/Users/litos/.ipython']

In [3]:
from gurobipy import *

from scipy.sparse import csr_matrix, load_npz, save_npz
from tqdm import tqdm
from sklearn.preprocessing import normalize
from collections import *
import datetime
import json
import pandas as pd
import time
# import yaml
import scipy.sparse as sparse
from ast import literal_eval

import numpy as np
import matplotlib.pyplot as plt
import random

from sklearn.linear_model import LinearRegression
from sklearn.preprocessing import normalize
from sklearn.linear_model import Ridge
from sklearn.utils.extmath import randomized_svd

from scipy.optimize import minimize

# Utils

In [4]:
def save_dataframe_csv(df, path, name):
    df.to_csv(path+name, index=False)


def load_dataframe_csv(path, name, index_col=None):
    return pd.read_csv(path+name, index_col=index_col)


# Load Data

In [5]:
# Load Original Data
df_train = pd.read_csv('../../data/yelp/Train.csv',encoding='latin-1')
# df_valid = pd.read_csv('../../data/yelp/Valid.csv',encoding='latin-1')
# df_test = pd.read_csv('../../data/yelp/Test.csv',encoding='latin-1')

In [6]:
keyphrases = pd.read_csv('../../data/yelp/KeyPhrases.csv')['Phrases'].tolist()
keyphrase_popularity = np.loadtxt('../data/yelp/'+'keyphrase_popularity.txt', dtype=int)

# Load U-I Data 
rtrain = load_npz("../../data/yelp/Rtrain.npz")
rvalid = load_npz("../../data/yelp/Rvalid.npz")
rtest = load_npz("../../data/yelp/Rtest.npz")

# Load user/item keyphrase data
U_K = load_npz("../../data/yelp/U_K.npz")
I_K = load_npz("../../data/yelp/I_K.npz")

# Models

In [7]:
def get_I_K(df, row_name = 'ItemIndex', shape = (3668,75)):
    rows = []
    cols = []
    vals = []
    for i in tqdm(range(df.shape[0])):
        key_vector = literal_eval(df['keyVector'][i])
        rows.extend([df[row_name][i]]*len(key_vector)) ## Item index
        cols.extend(key_vector) ## Keyword Index
        vals.extend(np.array([1]*len(key_vector)))
    return csr_matrix((vals, (rows, cols)), shape=shape)


In [8]:
# PLREC 
def inhour(elapsed):
    return time.strftime('%H:%M:%S', time.gmtime(elapsed))

def plrec(matrix_train, iteration=4, lamb=80, rank=200, seed=1):
    """
    Function used to achieve generalized projected lrec w/o item-attribute embedding
    :param matrix_train: user-item matrix with shape m*n
    :param iteration: number of power iterations in randomized svd
    :param lamb: parameter of penalty
    :param rank: latent dimension size
    :param seed: the seed of the pseudo random number generator to use when shuffling the data
    :return: prediction in sparse matrix
    """
    print ("Randomized SVD")
    start_time = time.time()
    P, sigma, Qt = randomized_svd(matrix_train,
                                  n_components=rank,
                                  n_iter=iteration,
                                  random_state=seed)

    RQ = matrix_train.dot(sparse.csc_matrix(Qt.T*np.sqrt(sigma)))

    print("Elapsed: {}".format(inhour(time.time() - start_time)))

    print ("Closed-Form Linear Optimization")
    start_time = time.time()
    pre_inv = RQ.T.dot(RQ) + lamb * sparse.identity(rank, dtype=np.float32)
    inverse = sparse.linalg.inv(pre_inv.tocsc())
    Y = inverse.dot(RQ.T).dot(matrix_train)
    print("Elapsed: {}".format(inhour(time.time() - start_time)))

    return np.array(RQ.todense()), np.array(Y.todense()), None

# def predict_vector(rating_vector, train_vector, remove_train=True):
#     dim = len(rating_vector)
#     candidate_index = np.argpartition(-rating_vector, dim-1)[:dim]
#     prediction_items = candidate_index[rating_vector[candidate_index].argsort()[::-1]]
    
#     if remove_train:
#         return np.delete(prediction_items, np.isin(prediction_items, train_vector.nonzero()[1]).nonzero()[0])
#     else:
#         return prediction_items

    
def predict_scores(matrix_U, matrix_V, bias=None,
                   penalize = False,
                   keyphrase_freq = I_K, 
                   critiqued_keyphrase = 0, 
                   matrix_Train = rtrain,
                   alpha = 0):
    prediction = matrix_U.dot(matrix_V.T)
    # Penalize
    if penalize == True:
        items_with_keyphrase = np.ravel(keyphrase_freq.T[critiqued_keyphrase].nonzero()[1])
        items_without_keyphrase = np.setdiff1d(np.arange(matrix_Train.shape[1]), items_with_keyphrase)
        prediction[items_without_keyphrase] = alpha # penalize
    
    return prediction

def predict_vector(rating_vector, train_vector, remove_train=True):
    dim = len(rating_vector)
    candidate_index = np.argpartition(-rating_vector, dim-1)[:dim]
    prediction_items = candidate_index[rating_vector[candidate_index].argsort()[::-1]]
    
    if remove_train:
        return np.delete(prediction_items, np.isin(prediction_items, train_vector.nonzero()[1]).nonzero()[0])
    else:
        return prediction_items


In [9]:
# initial Prediction
def predict_scores(matrix_U, matrix_V, bias=None,
                   penalize = False,
                   keyphrase_freq = I_K, 
                   critiqued_keyphrase = 0, 
                   matrix_Train = rtrain,
                   alpha = 0):
    
    prediction = matrix_U.dot(matrix_V.T)
    # Penalize
    if penalize == True:
        items_with_keyphrase = np.ravel(keyphrase_freq.T[critiqued_keyphrase].nonzero()[1])
        items_without_keyphrase = np.setdiff1d(np.arange(matrix_Train.shape[1]), items_with_keyphrase)
        prediction[items_without_keyphrase] = alpha # penalize
    
    return prediction


In [10]:
# Keyphrase Selection Helpers
def get_valid_keyphrases(keyphrase_freq,top_recommendations,item = None,threshold=50,mutiple_keyphrases_en = False, top_items = None):
    """
    Wrapper function to get either top 1 or top n keyphrases
    """
    if mutiple_keyphrases_en:
        top_keyphrases = []
        for item in top_items:
            top_keyphrases.extend(get_valid_keyphrases_for_one_item(keyphrase_freq,top_recommendations,item,threshold=threshold))
        return np.ravel(list(set(top_keyphrases))) # remove duplicate and reformat to np array
    else:
        return get_valid_keyphrases_for_one_item(keyphrase_freq,top_recommendations,item,threshold=threshold)

def get_valid_keyphrases_for_one_item(keyphrase_freq,top_recommendations, item,threshold=50):
    """
    Get keyphrases of item that make sense
    E.g. if the item has fewer than threshold=50 keyphrases, get all of them
    otherwise get top 50 keyphrases
    """
    keyphrase_length = len(keyphrase_freq[item].nonzero()[1])
    if keyphrase_length<threshold:
        return keyphrase_freq[item].nonzero()[1]
    else:
        keyphrases = np.ravel(keyphrase_freq[top_recommendations[0]].todense())
        top_keyphrases = np.argsort(keyphrases)[::-1][:threshold]
        return top_keyphrases
    
# For keyphrase selecting method # 3 "diff" 
def get_item_keyphrase_freq(keyphrase_freq,item):
    """
    Get item's keyphrase frequency 
    """
    count = keyphrase_freq[item].todense()
    return np.ravel(count/(np.sum(count)+0.001))

def get_all_item_keyphrase_freq(item_keyphrase_freq = I_K):
    res = []
    num_items = item_keyphrase_freq.shape[0]
    for item in range(num_items):
        res.append(np.ravel(get_item_keyphrase_freq(item_keyphrase_freq,item)))
    return np.array(res)

def get_keyphrase_popularity(df,keyphrases):
    """
    Get keyphrase popularity (count) from dataframe
    """
    keyphrase_popularity = np.zeros(len(keyphrases)) #initialize
    for i in range(len(df)):
        keyphrase_vector = literal_eval(df['keyVector'][i])
        keyphrase_popularity[keyphrase_vector] += 1 # count
    return keyphrase_popularity

In [11]:
all_item_keyphrase_freq = get_all_item_keyphrase_freq()

In [12]:
# One hot encoding of critiquing
def get_critiqued_UK(user_keyphrase_frequency,user_index,critiqued_keyphrase):
    """
    user_keyphrase_frequency is the U_K matrix (csr sparse matrix)
    return the one-hot encoding of the critique
    """
    U_K_cp = user_keyphrase_frequency.copy()
    U_K_cp[user_index] = 0
    U_K_cp[user_index,critiqued_keyphrase] = 1
    return U_K_cp

def project_one_hot_encoding(reg, user_keyphrase_frequency,user_index = 0,critiqued_keyphrase = 0, normalize_en = True):
    """
    Return the projection on user_sim space from one-hot encoding of critiqued keyphrase
    The res[user_index] should be target embedding row
    """
    critiqued_matrix = get_critiqued_UK(user_keyphrase_frequency, user_index, critiqued_keyphrase)
    res = reg.predict(critiqued_matrix)
    if normalize_en:
        res = normalize((res))
    return res

In [13]:
# Upper bound method 
def get_all_affected_items(wanted_keyphrases,keyphrase_freq):
    res = []
    for keyphrase in wanted_keyphrases:
        items = np.ravel(keyphrase_freq.T[keyphrase].nonzero()[1])
        res.extend(items)
    return np.array(list(set(res)))
    
def select_only_wanted_keyphrase(top_recommendations, wanted_keyphrases, keyphrase_freq, matrix_Train = rtrain):
    all_items_with_keyphrases = get_all_affected_items(wanted_keyphrases,keyphrase_freq)
    affected_items = np.setdiff1d(np.arange(matrix_Train.shape[1]), all_items_with_keyphrases) # Get all other keyphrases
    top_recommendations[~np.in1d(top_recommendations, affected_items)]
    return top_recommendations

def pruning(prediction_score, 
           wanted_keyphrases_random, 
           top_recommendations, 
           keyphrase_freq, 
           matrix_Train = rtrain,
           alpha = 0):
    items_with_keyphrase = get_all_affected_items(wanted_keyphrases_random, keyphrase_freq)
    #Return the unique values in ar1 that are not in ar2.
    items_without_keyphrase = np.setdiff1d(np.arange(matrix_Train.shape[1]), items_with_keyphrase)
#     print (items_without_keyphrase)
    print (sum(prediction_score[items_without_keyphrase]))
    score = np.copy(prediction_score)
    score[items_without_keyphrase] = alpha # penalize
    return score

# Utils

In [14]:
# Utility function for getting restaurant info from ItemIndex
def get_business_df(path = "../../data/yelp/business.json" ):
    with open(path,encoding="utf8") as json_file:
        data = json_file.readlines()
        data = list(map(json.loads, data))
    df = pd.DataFrame(data)
    
    return df

def get_restaurant_info(business_df, business_id, name = True, review_count = True, stars = True ):
    output_list = {}
    row_idx = int(business_df.index[business_df['business_id'] == business_id].tolist()[0])
    if name == True:
        output_list['name'] = business_df['name'][row_idx].encode('utf-8').strip()
    if review_count == True:
        output_list['review_count'] = business_df['review_count'][row_idx]
    if stars == True:
        output_list['stars'] = business_df['stars'][row_idx] 
    return output_list

# def get_businessid_from_Itemindex(ItemIndex_list, itemindex):
#     return ItemIndex_list['business_id'].tolist()[itemindex]

def get_restaurant_name(df_train, business_df, ItemIndex):
    rows = np.where(df_train['ItemIndex'] == ItemIndex)
    if len(rows)!= 0:
        business_id = df_train.loc[rows[0][0]]['business_id']
        item_info = get_restaurant_info(business_df, business_id)
        return item_info['name']
    return "NOT_FOUND"

# Evaluation 

In [15]:
# Evluation 
def recallk(vector_true_dense, hits, **unused):
    hits = len(hits.nonzero()[0])
    return float(hits)/len(vector_true_dense)

def precisionk(vector_predict, hits, **unused):
    hits = len(hits.nonzero()[0])
    return float(hits)/len(vector_predict)


def average_precisionk(vector_predict, hits, **unused):
    precisions = np.cumsum(hits, dtype=np.float32)/range(1, len(vector_predict)+1)
    return np.mean(precisions)


def r_precision(vector_true_dense, vector_predict, **unused):
    vector_predict_short = vector_predict[:len(vector_true_dense)]
    hits = len(np.isin(vector_predict_short, vector_true_dense).nonzero()[0])
    return float(hits)/len(vector_true_dense)


def _dcg_support(size):
    arr = np.arange(1, size+1)+1
    return 1./np.log2(arr)


def ndcg(vector_true_dense, vector_predict, hits):
    idcg = np.sum(_dcg_support(len(vector_true_dense)))
    dcg_base = _dcg_support(len(vector_predict))
    dcg_base[np.logical_not(hits)] = 0
    dcg = np.sum(dcg_base)
    return dcg/idcg


def click(hits, **unused):
    first_hit = next((i for i, x in enumerate(hits) if x), None)
    if first_hit is None:
        return 5
    else:
        return first_hit/10


def evaluate(matrix_Predict, matrix_Test, metric_names =['R-Precision', 'NDCG', 'Precision', 'Recall', 'MAP'], atK = [5, 10, 15, 20, 50], analytical=False):
    """
    :param matrix_U: Latent representations of users, for LRecs it is RQ, for ALSs it is U
    :param matrix_V: Latent representations of items, for LRecs it is Q, for ALSs it is V
    :param matrix_Train: Rating matrix for training, features.
    :param matrix_Test: Rating matrix for evaluation, true labels.
    :param k: Top K retrieval
    :param metric_names: Evaluation metrics
    :return:
    """
    global_metrics = {
        "R-Precision": r_precision,
        "NDCG": ndcg,
        "Clicks": click
    }

    local_metrics = {
        "Precision": precisionk,
        "Recall": recallk,
        "MAP": average_precisionk
    }

    output = dict()

    num_users = matrix_Predict.shape[0]

    for k in atK:

        local_metric_names = list(set(metric_names).intersection(local_metrics.keys()))
        results = {name: [] for name in local_metric_names}
        topK_Predict = matrix_Predict[:, :k]

        for user_index in tqdm(range(topK_Predict.shape[0])):
            vector_predict = topK_Predict[user_index]
            if len(vector_predict.nonzero()[0]) > 0:
                vector_true = matrix_Test[user_index]
                vector_true_dense = vector_true.nonzero()[1]
                hits = np.isin(vector_predict, vector_true_dense)

                if vector_true_dense.size > 0:
                    for name in local_metric_names:
                        results[name].append(local_metrics[name](vector_true_dense=vector_true_dense,
                                                                 vector_predict=vector_predict,
                                                                 hits=hits))

        results_summary = dict()
        if analytical:
            for name in local_metric_names:
                results_summary['{0}@{1}'.format(name, k)] = results[name]
        else:
            for name in local_metric_names:
                results_summary['{0}@{1}'.format(name, k)] = (np.average(results[name]),
                                                              1.96*np.std(results[name])/np.sqrt(num_users))
        output.update(results_summary)

    global_metric_names = list(set(metric_names).intersection(global_metrics.keys()))
    results = {name: [] for name in global_metric_names}

    topK_Predict = matrix_Predict[:]

    for user_index in tqdm(range(topK_Predict.shape[0])):
        vector_predict = topK_Predict[user_index]

        if len(vector_predict.nonzero()[0]) > 0:
            vector_true = matrix_Test[user_index]
            vector_true_dense = vector_true.nonzero()[1]
            hits = np.isin(vector_predict, vector_true_dense)

            # if user_index == 1:
            #     import ipdb;
            #     ipdb.set_trace()

            if vector_true_dense.size > 0:
                for name in global_metric_names:
                    results[name].append(global_metrics[name](vector_true_dense=vector_true_dense,
                                                              vector_predict=vector_predict,
                                                              hits=hits))

    results_summary = dict()
    if analytical:
        for name in global_metric_names:
            results_summary[name] = results[name]
    else:
        for name in global_metric_names:
            results_summary[name] = (np.average(results[name]), 1.96*np.std(results[name])/np.sqrt(num_users))
    output.update(results_summary)

    return output



# Critiquing Pipline

In [16]:
business_df = get_business_df()

In [17]:
keyphrase_popularity = np.loadtxt('../data/yelp/'+'keyphrase_popularity.txt', dtype=int)

In [18]:
Y, RQt, Bias = plrec(rtrain,
                    iteration = 10,
                    lamb = 200,
                    rank = 200)
RQ = RQt.T
reg = LinearRegression().fit(normalize(U_K), Y)

Randomized SVD
Elapsed: 00:00:00
Closed-Form Linear Optimization
Elapsed: 00:00:00


In [19]:
# Set up dataframe 

# post_ranki is post rank with different lambda ratio for combining pre-post User similarity matrix 

columns = ['user_id', 'target_item', 'item_name', 'iter', 'pre_rank', 
           'top_prediction_item_name',
           'post_rank_random_all',
           'post_rank_random_upper',
           'random_scores',
           'post_rank_pop_all',
           'post_rank_pop_upper',
           'pop_scores',
           'post_rank_diff_all',
           'post_rank_diff_upper',
           'diff_scores',
           'critiqued_keyphrase_random',
           'keyphrase_name_random',
           'critiqued_keyphrase_pop',
           'keyphrase_name_pop',
           'critiqued_keyphrase_diff',
           'keyphrase_name_diff',
           'num_existing_keyphrases',
           'pure_pruning_rank'] 
df = pd.DataFrame(columns=columns)
row = {}

## Average

In [48]:
def Average(initial_prediction_u, keyphrase_freq, affected_items, unaffected_items, num_keyphrases, query, test_user, item_latent, reg, all_equal = True):
    critiqued_vector = np.zeros(keyphrase_freq.shape[1])
    
    for q in query:
#         critiqued_vector[q] = 1
        critiqued_vector[q] = max(keyphrase_freq[test_user , q],1)
        
    num_critiques = len(query)
    
    # Get item latent for updating prediction
    W2 = reg.coef_
    W = item_latent.dot(W2)
    
    optimal_lambda = 1 # weight all critiquing equally
    
    lambdas = [optimal_lambda]*num_critiques
    
    # Record lambda values 
    for k in range(num_critiques):
        critiqued_vector[query[k]] *= optimal_lambda

    # Get rating score
    critique_score = predict_scores(matrix_U=reg.predict(critiqued_vector.reshape(1, -1)),
                                    matrix_V=item_latent)
    new_prediction = initial_prediction_u + critique_score.flatten()
    
#     if all_equal:
#         # weight initial and each critiquing equally 
#         new_prediction = initial_prediction_u/(num_critiques) + critique_score.flatten()
#     else:
#         # weight intial and combined critiquing equally
#         new_prediction = initial_prediction_u + critique_score.flatten() 
# #     print (len(new_prediction))
    return new_prediction, lambdas   


## Rating Objective

In [98]:
def LP1SimplifiedOptimize(initial_prediction_u, keyphrase_freq, affected_items, unaffected_items, num_keyphrases, 
                          query, test_user, item_latent, reg):

    critiqued_vector = np.zeros(keyphrase_freq.shape[1])

    for q in query:
#         critiqued_vector[q] = -keyphrase_freq[test_user][q]
        critiqued_vector[q] = max(keyphrase_freq[test_user , q],1)

    num_critiques = len(query)
    
    W2 = reg.coef_
    W = item_latent.dot(W2)

    num_affected_items = len(affected_items)
    num_unaffected_items = len(unaffected_items)

    start_time = time.time()

    # Model
    m = Model("LP1Simplified")
    m.setParam('OutputFlag', 0)
    # Assignment variables
    lambs = []

    for k in range(num_critiques):
        lambs.append(m.addVar(lb=-1,
                              ub=1,
                              vtype=GRB.CONTINUOUS,
                              name="lamb%d" % query[k]))
        
    print ('affected_items', affected_items)
    print (int(affected_items[0]))
    print ('unaffected_items', unaffected_items)
    print (int(unaffected_items[0]))
    
#     m.setObjective( quicksum(initial_prediction_u[unaffected_item] * num_affected_items + quicksum(lambs[i] * critiqued_vector[query[i]] * W[unaffected_item][query[i]] * num_affected_items for i in range(num_critiques) ) for unaffected_item in unaffected_items - 
#                     quicksum(initial_prediction_u[affected_item] * num_unaffected_items + quicksum(lambs[i] * critiqued_vector[query[i]] * W[affected_item][query[i]] * num_unaffected_items for i in range(num_critiques) ) for affected_item in affected_items)), GRB.MINIMIZE)
    m.setObjective(quicksum(initial_prediction_u[affected_item] * num_unaffected_items + quicksum(lambs[k] * critiqued_vector[query[k]] * W[affected_item][query[k]] * num_unaffected_items for k in range(num_critiques)) for affected_item in affected_items) - quicksum(initial_prediction_u[unaffected_item] * num_affected_items + quicksum(lambs[k] * critiqued_vector[query[k]] * W[unaffected_item][query[k]] * num_affected_items for k in range(num_critiques)) for unaffected_item in unaffected_items), GRB.MAXIMIZE)

    # Optimize
    m.optimize()

#     print("Elapsed: {}".format(inhour(time.time() - start_time)))

    lambdas = []
    for k in range(num_critiques):
        optimal_lambda = m.getVars()[k].X
        lambdas.append(optimal_lambda)
        critiqued_vector[query[k]] *= optimal_lambda

    critique_score = predict_scores(matrix_U=reg.predict(critiqued_vector.reshape(1, -1)),
                                    matrix_V=item_latent)

    new_prediction = initial_prediction_u + critique_score.flatten()

    return new_prediction, lambdas


## RankSVM Objective

In [33]:
#### See https://www.overleaf.com/read/wwftdhpcmxnx
#### For the RankSVM math

def rankSVM(initial_prediction_u, keyphrase_freq, affected_items, unaffected_items, num_keyphrases, 
            query, test_user, item_latent, reg, user_latent_embedding, item_keyphrase_freq = I_K):
    critiques = query # fix this variable name later
    
#     critiqued_vector = np.zeros(keyphrase_freq.shape[1])
    
#     for c in critiques:
# #         critiqued_vector[q] = 1 # set critiqued/boosted keyphrase to 1
#         critiqued_vector[c] = max(keyphrase_freq[test_user , c],1)
# #         print ('critiqued_vector setting: ',critiqued_vector[q])
#     print ('affected items, ',affected_items)
#     print ('unaffected items, ',unaffected_items)
    
    num_critiques = len(critiques)

    W2 = reg.coef_
    W = item_latent.dot(W2)

    num_affected_items = len(affected_items)
    num_unaffected_items = len(unaffected_items)

    start_time = time.time()

    # Model
    m = Model("LP2RankSVM")
    m.setParam('OutputFlag', 0)
    
    # Assignment variables
    thetas = []
    us = []
    xis = []
    # weight thetas
    for k in range(num_critiques + 1):
        thetas.append(m.addVar(lb=-1,
                              ub=1,
                              vtype=GRB.CONTINUOUS,
                              name="theta%d" % k))
    thetas = np.array(thetas)
    # dummy variable u for absolute theta
    for k in range(num_critiques + 1):
        us.append(m.addVar(vtype=GRB.CONTINUOUS,
                          name="u%d" % k))
        
    # slack variables xi
    for i in range(num_affected_items):
        for j in range(num_unaffected_items):
            xis.append(m.addVar(lb = 0, 
                                vtype = GRB.CONTINUOUS,
                                name = "xi_%d_%d" % (i,j) ))
      
    ## constraints
    # constraints for dummy variable u's
    for k in range(num_critiques+1):
        m.addConstr(us[k] >= thetas[k])
        m.addConstr(us[k] >= -thetas[k])
        
    
    ## Pre-calculate critique embedding
    u_i = Y[test_user]
    phi_js = []
    phi_jprimes = []
    k_cis = []
    
    user_latent_embedding = np.array(user_latent_embedding)
#     print ('user latent embedding shape: ', user_latent_embedding.shape)
    # constraints for rankSVM 
    for j in range(num_affected_items):
        for j_ in range(num_unaffected_items):
            m.addConstr( thetas.dot(user_latent_embedding.dot(RQ[affected_items[j]])) >= thetas.dot(user_latent_embedding.dot(RQ[unaffected_items[j_]])) + 1 - xis[j*num_affected_items + j_], name = "constraints%d_%d" % (j,j_))
#             print ('item j embedding :',user_latent_embedding.dot(RQ[j]) )
#             print ('item j_ embedding:',user_latent_embedding.dot(RQ[j_]) )
    lamb = 5 #regularization parameter (trading-off margin size against training error
    m.setObjective(quicksum(us) + lamb * quicksum(xis), GRB.MINIMIZE)
                
    # Optimize
    m.optimize()

#     print("Elapsed: {}".format(inhour(time.time() - start_time)))

    thetas = []
    for k in range(num_critiques+1):
        optimal_theta = m.getVarByName("theta%d" % k).X
        thetas.append(optimal_theta)
        
#     print ('optimal thetas: ',thetas)


    critiqued_vector = np.zeros(keyphrase_freq.shape[1])
    
    # Combine weights to critiqued vector
    for c in critiques:
#         critiqued_vector[q] = 1 # set critiqued/boosted keyphrase to 1
        critiqued_vector[c] = max(keyphrase_freq[test_user , c],1)
    for k in range(num_critiques):
        critiqued_vector[critiques[k]] *= thetas[k+1]
    
    # Get rating score
    critique_score = predict_scores(matrix_U=reg.predict(critiqued_vector.reshape(1, -1)),
                                    matrix_V=item_latent)
    new_prediction = thetas[0]*initial_prediction_u + critique_score.flatten()
    
    return new_prediction, thetas

In [41]:
#### See https://www.overleaf.com/read/wwftdhpcmxnx
#### For the RankSVM math

def rankSVM2(initial_prediction_u, keyphrase_freq, affected_items, unaffected_items, num_keyphrases, 
            query, test_user, item_latent, reg, user_latent_embedding, item_keyphrase_freq = I_K, lamb = [5,5]):
    critiques = query # fix this variable name later

    # pre calculate some value
    num_critiques = len(critiques)

    num_affected_items = len(affected_items)
    num_unaffected_items = len(unaffected_items)

#     start_time = time.time()

    # Model
    m = Model("LP2RankSVM2")
    m.setParam('OutputFlag', 0) # set to 1 for outputing details
    
    # Assignment variables
    thetas = []
    us = []
    xi_pos = []
    xi_neg = []
    # weight thetas
    for k in range(num_critiques + 1):
        thetas.append(m.addVar(lb=-1,
                              ub=1,
                              vtype=GRB.CONTINUOUS,
                              name="theta%d" % k))
    thetas = np.array(thetas)
    
    # dummy variable u for absolute theta
    for k in range(num_critiques + 1):
        us.append(m.addVar(vtype=GRB.CONTINUOUS,
                          name="u%d" % k))
        
    # slack variables xi
    for i in range(num_affected_items):
        xi_pos.append(m.addVar(lb = 0, 
                                vtype = GRB.CONTINUOUS,
                                name = "xi_pos%d" % i ))
    for i in range(num_unaffected_items):
        xi_neg.append(m.addVar(lb = 0, 
                                vtype = GRB.CONTINUOUS,
                                name = "xi_neg%d" % i ))
        
    ## constraints
    # constraints for dummy variable u's
    for k in range(num_critiques+1):
        m.addConstr(us[k] >= thetas[k])
        m.addConstr(us[k] >= -thetas[k])
 
    user_latent_embedding = np.array(user_latent_embedding)
    
    # Affected items rank higher
    for j in range(num_affected_items):
        m.addConstr( thetas.dot(user_latent_embedding.dot(RQ[affected_items[j]])) >= initial_prediction_u[affected_items[j]] + 1 - xi_pos[j], name = "pos_constraint%d" % j )
    
    # Unaffected items rank lower
    for j in range(num_unaffected_items):
        m.addConstr( initial_prediction_u[unaffected_items[j]] - thetas.dot(user_latent_embedding.dot(RQ[unaffected_items[j]])) >=  1 - xi_neg[j], name = "neg_constraint%d" % j )
            
    # objective
    lamb1 = lamb[0] #regularization for trading-off margin size against training error
    lamb2 = lamb[1] #regularization for trading-off deviation from Averaging 

    m.setObjective(quicksum(us) + lamb1 * (quicksum(xi_pos)+quicksum(xi_neg)) + lamb2 * quicksum( [( 1- theta) for theta in thetas]), GRB.MINIMIZE) 
    

                
    # Optimize
    m.optimize()

    # Save optimal thetas
    thetas = []
    for k in range(num_critiques+1):
        optimal_theta = m.getVarByName("theta%d" % k).X
        thetas.append(optimal_theta)
        
    critiqued_vector = np.zeros(keyphrase_freq.shape[1])
    
    # Combine weights to critiqued vector
    for c in critiques:
#         critiqued_vector[c] = 1 # set critiqued/boosted keyphrase to 1
        critiqued_vector[c] = max(keyphrase_freq[test_user , c],1)
    
    for k in range(num_critiques):
        critiqued_vector[critiques[k]] *= thetas[k+1]
    
    # Get rating score
    critique_score = predict_scores(matrix_U=reg.predict(critiqued_vector.reshape(1, -1)),
                                    matrix_V=item_latent)
    new_prediction = thetas[0]*initial_prediction_u/num_critiques + critique_score.flatten()
#     new_prediction = initial_prediction_u/num_critiques + critique_score.flatten()
#     new_prediction = critique_score.flatten()
    
    return new_prediction, thetas

In [60]:
#### Changes minimization objective compares to ranksvm2

def rankSVM3(initial_prediction_u, keyphrase_freq, affected_items, unaffected_items, num_keyphrases, 
            query, test_user, item_latent, reg, user_latent_embedding, item_keyphrase_freq = I_K, lamb = [5,5]):
    critiques = query # fix this variable name later

    # pre calculate some value
    num_critiques = len(critiques)

    num_affected_items = len(affected_items)
    num_unaffected_items = len(unaffected_items)

#     start_time = time.time()

    # Model
    m = Model("LP2RankSVM2")
    m.setParam('OutputFlag', 0) # set to 1 for outputing details
    
    # Assignment variables
    thetas = []
    us = []
    xi_pos = []
    xi_neg = []
    # weight thetas
    for k in range(num_critiques + 1):
        thetas.append(m.addVar(lb=-2,
                              ub=2,
                              vtype=GRB.CONTINUOUS,
                              name="theta%d" % k))
    thetas = np.array(thetas)
    
    # dummy variable u for absolute theta
    for k in range(num_critiques + 1):
        us.append(m.addVar(vtype=GRB.CONTINUOUS,
                          name="u%d" % k))
        
    # slack variables xi
    for i in range(num_affected_items):
        xi_pos.append(m.addVar(lb = 0, 
                                vtype = GRB.CONTINUOUS,
                                name = "xi_pos%d" % i ))
    for i in range(num_unaffected_items):
        xi_neg.append(m.addVar(lb = 0, 
                                vtype = GRB.CONTINUOUS,
                                name = "xi_neg%d" % i ))
        
    ## constraints
    # constraints for dummy variable u's
    for k in range(num_critiques+1):
        m.addConstr(us[k] >= thetas[k] - 1)
        m.addConstr(us[k] >= 1 - thetas[k])
 
    user_latent_embedding = np.array(user_latent_embedding)
    
    # Affected items rank higher
    for j in range(num_affected_items):
        m.addConstr( thetas.dot(user_latent_embedding.dot(RQ[affected_items[j]])) >= initial_prediction_u[affected_items[j]] + 1 - xi_pos[j], name = "pos_constraint%d" % j )
    
    # Unaffected items rank lower
    for j in range(num_unaffected_items):
        m.addConstr( initial_prediction_u[unaffected_items[j]] - thetas.dot(user_latent_embedding.dot(RQ[unaffected_items[j]])) >=  1 - xi_neg[j], name = "neg_constraint%d" % j )
            
    # objective
    lamb1 = lamb[0] #regularization for trading-off margin size against training error
    lamb2 = lamb[1] #regularization for trading-off deviation from Averaging 

    m.setObjective(lamb1* quicksum(us) + lamb2 * (quicksum(xi_pos)+quicksum(xi_neg)), GRB.MINIMIZE) 
    
                
    # Optimize
    m.optimize()

    # Save optimal thetas
    thetas = []
    for k in range(num_critiques+1):
        optimal_theta = m.getVarByName("theta%d" % k).X
        thetas.append(optimal_theta)
        
    critiqued_vector = np.zeros(keyphrase_freq.shape[1])
    
    # Combine weights to critiqued vector
    for c in critiques:
#         critiqued_vector[c] = 1 # set critiqued/boosted keyphrase to 1
        critiqued_vector[c] = max(keyphrase_freq[test_user , c],1)
    
    for k in range(num_critiques):
        critiqued_vector[critiques[k]] *= thetas[k+1]
    
    # Get rating score
    critique_score = predict_scores(matrix_U=reg.predict(critiqued_vector.reshape(1, -1)),
                                    matrix_V=item_latent)
    new_prediction = thetas[0]*initial_prediction_u/num_critiques + critique_score.flatten()
#     new_prediction = initial_prediction_u/num_critiques + critique_score.flatten()
#     new_prediction = critique_score.flatten()
    
    return new_prediction, thetas

# Main

In [89]:
class LP1Simplified(object):
    def __init__(self, keyphrase_freq, item_keyphrase_freq, row, matrix_Train, matrix_Test, test_users,
                 target_ranks, num_items_sampled, num_keyphrases, df,
                 max_iteration_threshold, keyphrase_popularity, dataset_name,
                 model, parameters_row, keyphrases_names, keyphrase_selection_method, max_wanted_keyphrase, lamb, **unused):
        self.keyphrase_freq = keyphrase_freq
        self.item_keyphrase_freq = item_keyphrase_freq
        self.row = row
        self.matrix_Train = matrix_Train
        self.num_users, self.num_items = matrix_Train.shape
        self.matrix_Test = matrix_Test
        self.test_users = test_users
        self.target_ranks = target_ranks
        self.num_items_sampled = num_items_sampled
        self.num_keyphrases = num_keyphrases
        self.df = df
        self.max_iteration_threshold = max_iteration_threshold
        self.keyphrase_popularity = keyphrase_popularity
        self.dataset_name = dataset_name
        self.model = model
        self.parameters_row = parameters_row
        self.keyphrase_selection_method = keyphrase_selection_method
        self.max_wanted_keyphrase = max_wanted_keyphrase
        
        self.lamb = lamb
        self.keyphrases_names = keyphrases_names

    def start_critiquing(self):
#         self.get_initial_predictions() # No need to do it every time
        self.RQ = RQ
        Yt = Y.T 
        self.Y = Y

        self.reg = reg

        self.prediction_scores = predict_scores(matrix_U=self.RQ,
                                                matrix_V=self.Y,
                                                bias=Bias).T
        
        for user in tqdm(self.test_users):
            start_time = time.time()
            # User id starts from 0
            self.row['user_id'] = user
            
            initial_prediction_items = predict_vector(rating_vector=self.prediction_scores[user],
                                                            train_vector=self.matrix_Train[user],
                                                            remove_train=True)
            # For keyphrase selection method 'diff' 
            top_recommended_keyphrase_freq = get_item_keyphrase_freq(self.item_keyphrase_freq,item = initial_prediction_items[0])
            
            # The iteration will stop if the wanted item is in top n
            for target_rank in self.target_ranks:
                self.row['target_rank'] = target_rank
                
                # Pick wanted items in test items
                candidate_items = self.matrix_Test[user].nonzero()[1]
                train_items = self.matrix_Train[user].nonzero()[1]
                wanted_items = np.setdiff1d(candidate_items, train_items)
                
                for item in wanted_items:
                    # Item id starts from 0
                    self.row['item_id'] = item
                    try:
                        self.row['item_name'] = get_restaurant_name(df_train, business_df,item)
                    except:
                        self.row['item_name'] = 'NOT_FOUND'
                    # Set the wanted item's initial rank as None
                    self.row['item_rank'] = None
                    # Set the wanted item's initial prediction score as None
                    self.row['item_score'] = None
                    
                    if self.keyphrase_selection_method == "random" or self.keyphrase_selection_method == "pop":
                        # Get the item's existing keyphrases (we can boost)
                        remaining_keyphrases = self.item_keyphrase_freq[item].nonzero()[1]
                    if self.keyphrase_selection_method == "diff":
                        # For keyphrase selection method 'diff' 
                        target_keyphrase_freq = get_item_keyphrase_freq(self.item_keyphrase_freq,item = item)
                        diff_keyphrase_freq = target_keyphrase_freq - top_recommended_keyphrase_freq
                        remaining_keyphrases = np.argsort(np.ravel(diff_keyphrase_freq))[::-1][:self.max_wanted_keyphrase]
                        
#                    print("The number of remaining_keyphrases is {}. remaining_keyphrases are: {}".format(len(remaining_keyphrases), remaining_keyphrases))
                    self.row['num_existing_keyphrases'] = len(remaining_keyphrases)
                    if len(remaining_keyphrases) == 0:
                        break
                    self.row['iteration'] = 0
                    self.row['critiqued_keyphrase'] = None
                    self.row['result'] = None
                    self.df = self.df.append(self.row, ignore_index=True)

                    query = []
                    affected_items = np.array([])
                    
                    # Set up latent embedding
                    user_latent_embedding = [Y[user]]
                    
                    for iteration in range(self.max_iteration_threshold):
                        self.row['iteration'] = iteration + 1
                                                
                        if self.keyphrase_selection_method == "pop":
                            # Always critique the most popular keyphrase
                            critiqued_keyphrase = remaining_keyphrases[np.argmax(self.keyphrase_popularity[remaining_keyphrases])]
    #                        print("remaining keyphrases popularity: {}".format(self.keyphrase_popularity[remaining_keyphrases]))
                        elif self.keyphrase_selection_method == "random":
                            critiqued_keyphrase = np.random.choice(remaining_keyphrases, size=1, replace=False)[0]
            
                        elif self.keyphrase_selection_method == "diff":
                            critiqued_keyphrase = remaining_keyphrases[0]
#                             print ('critiqued_keyphrase', critiqued_keyphrase)
                        
                        self.row['critiqued_keyphrase'] = critiqued_keyphrase
                        self.row['critiqued_keyphrase_name'] = keyphrases_names[critiqued_keyphrase]
                        query.append(critiqued_keyphrase)

                        # Get affected items (items have critiqued keyphrase)
                        current_affected_items = self.item_keyphrase_freq[:, critiqued_keyphrase].nonzero()[0]
                        affected_items = np.unique(np.concatenate((affected_items, current_affected_items))).astype(int)
                        unaffected_items = np.setdiff1d(range(self.num_items), affected_items)

                        if iteration == 0:
                            prediction_items = initial_prediction_items #calculated once for each user

                        affected_items_mask = np.in1d(prediction_items, affected_items)
                        affected_items_index_rank = np.where(affected_items_mask == True)
                        unaffected_items_index_rank = np.where(affected_items_mask == False)

                        import copy
                        
                        ## concat critique embeddings to user latent embedding
                        # Get critique vector 
                        critiqued_vector = np.zeros(self.keyphrase_freq.shape[1])
                        critiqued_vector[critiqued_keyphrase] = max(self.keyphrase_freq[user , critiqued_keyphrase],1)
                        # map user critique to user latent embedding
                        k_ci = reg.predict(critiqued_vector.reshape(1, -1)).flatten()
                        user_latent_embedding.append(k_ci)
#                         print ('user latent embedding shape: ', np.array(user_latent_embedding).shape)

                        
#                         prediction_scores_u, lambdas = Average(initial_prediction_u=self.prediction_scores[user],
#                                                                              keyphrase_freq=copy.deepcopy(self.keyphrase_freq),
#                                                                              affected_items=np.intersect1d(affected_items, prediction_items[affected_items_index_rank[0][:20]]),
#                                                                              unaffected_items=np.intersect1d(unaffected_items, prediction_items[unaffected_items_index_rank[0][:20]]),
#                                                                              num_keyphrases=self.num_keyphrases,
#                                                                              query=query,
#                                                                              test_user=user,
#                                                                              item_latent=self.RQ,
#                                                                              reg=self.reg)
                        prediction_scores_u, lambdas = LP1SimplifiedOptimize(initial_prediction_u=self.prediction_scores[user],
                                                                             keyphrase_freq=copy.deepcopy(self.keyphrase_freq),
                                                                             affected_items=np.intersect1d(affected_items, prediction_items[affected_items_index_rank[0][:20]]),
                                                                             unaffected_items=np.intersect1d(unaffected_items, prediction_items[unaffected_items_index_rank[0][:20]]),
                                                                             num_keyphrases=self.num_keyphrases,
                                                                             query=query,
                                                                             test_user=user,
                                                                             item_latent=self.RQ,
                                                                             reg=self.reg)
#                         prediction_scores_u, lambdas = rankSVM(initial_prediction_u=self.prediction_scores[user],
#                                                                              keyphrase_freq=copy.deepcopy(self.keyphrase_freq),
#                                                                              affected_items=np.intersect1d(affected_items, prediction_items[affected_items_index_rank[0][:20]]),
#                                                                              unaffected_items=np.intersect1d(unaffected_items, prediction_items[unaffected_items_index_rank[0][:20]]),
#                                                                              num_keyphrases=self.num_keyphrases,
#                                                                              query=query,
#                                                                              test_user=user,
#                                                                              item_latent=self.RQ,
#                                                                              reg=self.reg,
#                                                                              user_latent_embedding = user_latent_embedding,
#                                                                              item_keyphrase_freq = all_item_keyphrase_freq
#                                                                              )
#                         prediction_scores_u, lambdas = rankSVM2(initial_prediction_u=self.prediction_scores[user],
#                                                                              keyphrase_freq=copy.deepcopy(self.keyphrase_freq),
#                                                                              affected_items=np.intersect1d(affected_items, prediction_items[affected_items_index_rank[0][:20]]),
#                                                                              unaffected_items=np.intersect1d(unaffected_items, prediction_items[unaffected_items_index_rank[0][:20]]),
#                                                                              num_keyphrases=self.num_keyphrases,
#                                                                              query=query,
#                                                                              test_user=user,
#                                                                              item_latent=self.RQ,
#                                                                              reg=self.reg,
#                                                                              user_latent_embedding = user_latent_embedding,
#                                                                              item_keyphrase_freq = all_item_keyphrase_freq,
#                                                                              lamb = self.lamb
#                                                                              )    
#                         prediction_scores_u, lambdas = rankSVM3(initial_prediction_u=self.prediction_scores[user],
#                                                                              keyphrase_freq=copy.deepcopy(self.keyphrase_freq),
#                                                                              affected_items=np.intersect1d(affected_items, prediction_items[affected_items_index_rank[0][:20]]),
#                                                                              unaffected_items=np.intersect1d(unaffected_items, prediction_items[unaffected_items_index_rank[0][:20]]),
#                                                                              num_keyphrases=self.num_keyphrases,
#                                                                              query=query,
#                                                                              test_user=user,
#                                                                              item_latent=self.RQ,
#                                                                              reg=self.reg,
#                                                                              user_latent_embedding = user_latent_embedding,
#                                                                              item_keyphrase_freq = all_item_keyphrase_freq,
#                                                                              lamb = self.lamb
#                                                                              )                       
    
#                         item_keyphrase_freq = get_all_item_keyphrase_freq()
                        
                        self.row['lambda'] = lambdas
                        prediction_items = predict_vector(rating_vector=prediction_scores_u,
                                                          train_vector=self.matrix_Train[user],
                                                          remove_train=False)
                        recommended_items = prediction_items
                        
                        # Current item rank
                        item_rank = np.where(recommended_items == item)[0][0]

                        self.row['item_rank'] = item_rank
                        self.row['item_score'] = prediction_scores_u[item]

                        if item_rank + 1 <= target_rank:
                            # Items is ranked within target rank
                            self.row['result'] = 'successful'
                            self.df = self.df.append(self.row, ignore_index=True)
                            break
                        else:
                            remaining_keyphrases = np.setdiff1d(remaining_keyphrases, critiqued_keyphrase)
                            # Continue if more keyphrases and iterations remained
                            if len(remaining_keyphrases) > 0 and self.row['iteration'] < self.max_iteration_threshold:
                                self.row['result'] = None
                                self.df = self.df.append(self.row, ignore_index=True)
                            else:
                                # Otherwise, mark fail
                                self.row['result'] = 'fail'
                                self.df = self.df.append(self.row, ignore_index=True)
                                break
#                         break ## For Testing LP Objective
        
            print("User ", user ,"Elapsed: {}".format(inhour(time.time() - start_time)))
        return self.df


    def get_initial_predictions(self):
        self.RQ, Yt, Bias = plrec(self.matrix_Train,
                                       iteration=self.parameters_row['iter'],
                                       lamb=self.parameters_row['lambda'],
                                       rank=self.parameters_row['rank'])
        self.Y = Yt.T

        self.reg = LinearRegression().fit(self.keyphrase_freq, self.RQ)

        self.prediction_scores = predict_scores(matrix_U=self.RQ,
                                                matrix_V=self.Y,
                                                bias=Bias)



In [99]:
row = {}
matrix_Train = rtrain
matrix_Test = rtest
# test_users = np.arange(25)
test_users = [1]
target_ranks = [20, 50]
num_items_sampled = 5
num_keyphrases = 235
df = pd.DataFrame(row)
max_iteration_threshold = 20
keyphrase_popularity = keyphrase_popularity
dataset_name = "yelp"
model = "plrec"
parameters_row = {'iter': 10,
                  'lambda':200,
                  'rank':200}
keyphrases_names = keyphrases
keyphrase_selection_method = 'diff'
max_wanted_keyphrase = 20
lamb = [1000,1]
critiquing_model = LP1Simplified(keyphrase_freq=U_K,
                                item_keyphrase_freq=I_K,
                                row=row,
                                matrix_Train=matrix_Train,
                                matrix_Test=matrix_Test,
                                test_users=test_users,
                                target_ranks=target_ranks,
                                num_items_sampled=num_items_sampled,
                                num_keyphrases=num_keyphrases,
                                df=df,
                                max_iteration_threshold=max_iteration_threshold,
                                keyphrase_popularity=keyphrase_popularity,
                                dataset_name=dataset_name,
                                model=model,
                                parameters_row=parameters_row,
                                keyphrases_names = keyphrases_names,
                                keyphrase_selection_method = keyphrase_selection_method,
                                max_wanted_keyphrase = max_wanted_keyphrase,
                                lamb = lamb)
df = critiquing_model.start_critiquing()

table_path = '../tables/critiquing/multi_step_critiquing/yelp/rating/'
name = 'rating_test.csv'
save_dataframe_csv(df, table_path, name)

  0%|          | 0/1 [00:00<?, ?it/s]

affected_items [  46 2320 2489 2906 3147 3244 3347 3699 3883 4729 4895 4901 5081 5136
 5436 5558 5993 6493 6568 6660]
46
unaffected_items [ 635  870 1061 1107 1527 1940 2525 2882 2975 3183 3260 3335 3337 3997
 4358 4673 4758 5870 6472 7056]
635
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 1 columns and 0 nonzeros
Model fingerprint: 0x292699f2
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [2e+02, 2e+02]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 1 columns
Presolve time: 0.01s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.0262173e+02   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.026217294e+02
Elapsed: 00:00:00
affected_items [ 870 1061 1940 2525 2906 2975 3183 3213 3244 3347 3699 3883 3889 4358
 4673 4901 4940 5639 5870 6660]
870
unaffected_it

  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+02, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 9 columns
Presolve time: 0.01s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    4.8039047e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  4.803904748e+03
Elapsed: 00:00:00
affected_items [  75   97  376  683 1090 1107 1113 2804 3499 3539 4037 4164 4443 5371
 5626 5985 6299 6732 6776 7100]
75
unaffected_items [ 722  892 1278 1461 1903 2195 2886 3171 4147 4543 4966 5268 5449 6040
 6288 6466 6636 6982 7137 7325]
722
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 10 columns and 0 nonzeros
Model fingerprint: 0x1aedced7
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [2e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00

Optimal objective  9.105475573e+03
Elapsed: 00:00:00
affected_items [ 683 1090 1107 1113 2188 2804 2925 3402 3499 4164 4443 5326 5371 5626
 5659 5763 6353 6776 7034 7100]
683
unaffected_items [ 582  892 1278 1952 2644 2693 2864 3242 3431 3905 4147 4543 4824 5023
 5246 5738 6294 6472 6636 6830]
582
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 19 columns and 0 nonzeros
Model fingerprint: 0xf13f49fa
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [2e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 19 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    9.1768865e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  9.176886489e+03
Elapsed: 00:00:00
affected_items [ 683 1090 1107 1113 2188 2804 2925 3402 3499 4164 4443 5326 537

Model fingerprint: 0x27dbc636
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [2e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 8 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    6.5532000e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  6.553199956e+03
Elapsed: 00:00:00
affected_items [ 683  735 1113 2154 2729 2804 2895 3166 3260 4443 4664 4928 5010 5340
 5410 5626 6131 6454 6776 7163]
683
unaffected_items [  19 1028 1085 1461 1903 2201 2644 2886 3933 4740 4966 5533 6040 6061
 6348 6559 6602 6636 6969 7413]
19
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 9 columns and 0 nonzeros
Model fingerprint: 0xcea53d88
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [7e+01, 2e+03]
  Bounds rang


Solved in 0 iterations and 0.01 seconds
Optimal objective  1.370478734e+04
Elapsed: 00:00:00
affected_items [ 419  585  683 1113 2804 2894 2895 3211 3512 4397 4443 5326 5363 5410
 5626 5659 5870 6454 6776 7163]
419
unaffected_items [ 544  580 1414 1442 2171 2236 2471 2693 2722 3941 4021 4156 4232 4804
 4896 5681 5779 6181 6339 6693]
544
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 18 columns and 0 nonzeros
Model fingerprint: 0xf6603060
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [7e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 18 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.3776293e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.377629259e+04
Elapsed: 00:00:00
affected_items [  97  419  585  683 11

Model fingerprint: 0xa4869721
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+02, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 7 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    8.2995130e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  8.299512982e+03
Elapsed: 00:00:00
affected_items [  75 1548 1898 2364 2412 2517 2729 2895 3097 4443 5098 5158 5315 5725
 6301 6454 6498 6660 7205 7213]
75
unaffected_items [  40 1363 1414 1980 2315 2433 2534 3532 3614 4966 5136 5310 5759 5853
 6267 6348 6778 6789 6800 6974]
40
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 8 columns and 0 nonzeros
Model fingerprint: 0x46b1e64a
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [7e+01, 3e+03]
  Bounds range


Solved in 0 iterations and 0.01 seconds
Optimal objective  1.390769249e+04
Elapsed: 00:00:00
affected_items [  75  325  585 1548 2412 2804 2847 2895 4072 4443 4908 5098 5340 5410
 6454 6498 6660 6938 7205 7213]
75
unaffected_items [ 366  944 1110 1414 1935 1962 2697 2755 3532 3720 4078 4298 5030 5208
 5500 5802 6264 6426 6941 7103]
366
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 17 columns and 0 nonzeros
Model fingerprint: 0x5fec63d2
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [3e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 17 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.4154410e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.415440960e+04
Elapsed: 00:00:00
affected_items [  75  325  585 1548 241

Optimize a model with 0 rows, 6 columns and 0 nonzeros
Model fingerprint: 0xd0cb2e4e
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+02, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 6 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    7.1692744e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  7.169274418e+03
Elapsed: 00:00:00
affected_items [1406 1445 1548 1985 2446 2804 3997 4141 4582 4786 4848 5047 5315 5659
 5870 6222 6454 6582 7137 7286]
1406
unaffected_items [  77 1122 1210 1300 1896 1980 2521 3863 4087 4360 4554 4824 5005 5478
 6240 6571 6577 6673 7118 7357]
77
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 7 columns and 0 nonzeros
Model fingerprint: 0xe0276fcc
Coefficient statistics:
  Matrix range     [0e+00

       0    1.5456275e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.545627521e+04
Elapsed: 00:00:00
affected_items [1406 1445 1548 1652 2754 2804 3347 3997 4458 4786 4848 5047 5315 5410
 5659 5870 6222 6454 6582 6739]
1406
unaffected_items [ 231 1168 1184 1525 2060 2377 2471 2920 3142 3146 3181 3977 5198 6289
 6894 7076 7184 7297 7362 7421]
231
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 16 columns and 0 nonzeros
Model fingerprint: 0x75cf3941
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [9e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 16 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.5685830e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.00 seconds
Optimal objective  1.56858

Optimize a model with 0 rows, 5 columns and 0 nonzeros
Model fingerprint: 0x721cd737
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [8e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 5 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    5.1656809e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  5.165680939e+03
Elapsed: 00:00:00
affected_items [  97 1522 1898 2364 2729 3428 4037 4443 4786 4848 5010 5098 5410 5730
 5852 6167 6353 6634 6644 7213]
97
unaffected_items [ 484  822 1743 1779 1980 2438 2534 2845 3286 4078 4255 5327 5469 5500
 5738 5773 5856 6608 7240 7243]
484
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 6 columns and 0 nonzeros
Model fingerprint: 0x659eed0a
Coefficient statistics:
  Matrix range     [0e+00,

       0    1.2694761e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.269476108e+04
Elapsed: 00:00:00
affected_items [1107 2188 2446 2729 2804 2916 3499 4443 4786 5131 5371 5626 5763 5985
 6004 6251 6299 6353 6776 7034]
1107
unaffected_items [ 318  484  516  554 1923 1980 3242 3312 3669 3905 4640 4740 4776 4824
 4830 5058 6117 6971 6992 7014]
318
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 15 columns and 0 nonzeros
Model fingerprint: 0x6ad75b33
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+02, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 15 columns
Presolve time: 0.01s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.3263130e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.32631

Optimize a model with 0 rows, 4 columns and 0 nonzeros
Model fingerprint: 0x3efdda51
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [2e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 4 columns
Presolve time: 0.01s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    2.5982173e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  2.598217319e+03
Elapsed: 00:00:00
affected_items [  75 1340 1548 1985 2446 2804 2895 3997 4786 5047 5081 5315 5340 5410
 5498 5763 6222 6454 6582 7286]
75
unaffected_items [ 486 1367 1410 1710 1787 1798 1880 2433 2644 2657 2694 2921 3337 3683
 3728 4087 4563 4835 5150 6773]
486
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 5 columns and 0 nonzeros
Model fingerprint: 0x14b0f413
Coefficient statistics:
  Matrix range     [0e+00,

       0    8.2653698e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  8.265369815e+03
Elapsed: 00:00:00
affected_items [ 683 1113 1159 1340 1445 1652 2804 3382 3428 3997 4195 4458 5410 5422
 5498 5659 5870 6222 6454 6776]
683
unaffected_items [ 599 1556 2471 2689 2692 2879 3977 4078 4660 5072 5198 5549 5635 5795
 6181 6464 6693 6894 7073 7184]
599
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 14 columns and 0 nonzeros
Model fingerprint: 0xb1c716d8
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [3e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 14 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    8.3764823e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  8.376482

Optimize a model with 0 rows, 3 columns and 0 nonzeros
Model fingerprint: 0xdbe8e29b
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [4e+02, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 3 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    5.2234108e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  5.223410825e+03
Elapsed: 00:00:00
affected_items [  97  585 1898 2364 2412 2729 2957 3211 4141 4443 4550 4673 5052 5098
 5852 6299 6498 7034 7205 7213]
97
unaffected_items [ 315  395  484 1192 1713 2086 2497 2885 3408 3861 3993 4268 4966 5046
 5738 6152 6170 6830 7157 7339]
315
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 4 columns and 0 nonzeros
Model fingerprint: 0x3af04c78
Coefficient statistics:
  Matrix range     [0e+00,

       0    1.2443751e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.244375069e+04
Elapsed: 00:00:00
affected_items [  97  585 1548 2729 2895 3097 4195 4443 4550 4673 4848 5098 5315 5364
 5410 5852 6454 6498 7205 7213]
97
unaffected_items [  29  178 1168 1414 1917 2689 2697 2722 2850 2938 3532 4068 4260 5802
 5878 6193 6693 6722 6834 7243]
29
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 13 columns and 0 nonzeros
Model fingerprint: 0xebe78bd7
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [7e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 13 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.3001498e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.30014984

Optimize a model with 0 rows, 2 columns and 0 nonzeros
Model fingerprint: 0x395d316e
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [3e+02, 1e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 2 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.6531460e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.653146047e+03
Elapsed: 00:00:00
affected_items [ 419  926 1082 2157 2804 3333 3402 3428 4141 4358 4443 4848 5108 5340
 5363 5852 6519 6568 6947 7286]
419
unaffected_items [ 252  594  861  905 1315 1410 1689 2135 2190 2414 2735 3156 3429 4293
 4984 5371 6040 6580 6628 7317]
252
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 3 columns and 0 nonzeros
Model fingerprint: 0xc7812f0b
Coefficient statistics:
  Matrix range     [0e+00

       0    7.6450695e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  7.645069479e+03
Elapsed: 00:00:00
affected_items [  43  419  637  683 1522 1608 2089 2157 2804 2847 3149 3428 4443 5363
 5972 6739 6776 7100 7163 7286]
43
unaffected_items [ 313  349  541 1838 2453 2464 2529 3142 3146 3777 3784 3941 3977 4217
 4248 4515 4740 6618 6677 7279]
313
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 12 columns and 0 nonzeros
Model fingerprint: 0x6b330b8c
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 12 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    7.9283197e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  7.9283197

Optimize a model with 0 rows, 1 columns and 0 nonzeros
Model fingerprint: 0x46aa340a
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [8e+00, 8e+00]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 1 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.5101096e+02   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.510109589e+02
Elapsed: 00:00:00
affected_items [  82   97  585 1898 2364 2412 2517 2847 3211 3980 4443 5098 5725 5852
 6498 7010 7034 7205 7207 7213]
82
unaffected_items [ 484 1079 1172 1743 1980 2152 2497 2534 2583 2845 2885 3286 4369 5136
 5738 6152 6170 6192 6800 7339]
484
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 2 columns and 0 nonzeros
Model fingerprint: 0x27f5492e
Coefficient statistics:
  Matrix range     [0e+00,

       0    8.4091234e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  8.409123394e+03
Elapsed: 00:00:00
affected_items [  75   97  926 1548 1584 1898 1985 2729 2895 3428 4443 4848 5098 5852
 6353 6454 6498 6744 7205 7213]
75
unaffected_items [ 484 1172 1363 1410 1414 1525 1549 1980 2116 2169 2438 2534 2697 2866
 3286 3611 5521 5856 7240 7243]
484
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 11 columns and 0 nonzeros
Model fingerprint: 0x864475fa
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [4e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 11 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    8.9261881e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  8.9261881

Optimize a model with 0 rows, 20 columns and 0 nonzeros
Model fingerprint: 0x876762f8
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [2e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 20 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.3482071e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.348207091e+04
Elapsed: 00:00:00
affected_items [ 870 1527 1940 2320 2525 2882 2906 2975 3260 3337 3347 3699 4358 4673
 4758 4895 4901 5870 6568 7056]
870
unaffected_items [ 446  986 1392 2921 3335 3729 3754 3756 4276 5546 5558 6003 6202 6303
 6390 6472 6493 6636 6680 7196]
446
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 1 columns and 0 nonzeros
Model fingerprint: 0x7b139340
Coefficient statistics:
  Matrix range     [0e+


Solved in 0 iterations and 0.01 seconds
Optimal objective  2.128361970e+03
Elapsed: 00:00:00
affected_items [ 683  735 2528 2925 3347 3368 3512 3739 4443 4599 5315 5340 5371 5626
 6059 6353 6947 7100 7163 7427]
683
unaffected_items [ 646 1410 1665 1743 1787 2229 2315 2609 3905 3941 4369 5066 5150 5204
 6031 6060 6294 6559 6579 7010]
646
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 10 columns and 0 nonzeros
Model fingerprint: 0x349b4225
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+01, 5e+02]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 10 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    2.3570753e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  2.357075341e+03
Elapsed: 00:00:00
affected_items [ 683  735 2528 2925 33

Optimize a model with 0 rows, 19 columns and 0 nonzeros
Model fingerprint: 0x75714ff1
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [3e+01, 2e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 19 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    7.1337948e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  7.133794846e+03
Elapsed: 00:00:00
affected_items [  75  683 2804 2925 2942 3347 3512 4443 5081 5286 5410 5422 5577 5626
 5870 6353 6568 6607 6776 7163]
75
unaffected_items [ 140  224  486 1442 1712 2124 2267 2471 2609 2722 2761 3941 4515 4737
 4740 5372 5634 5773 6636 6982]
140
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 20 columns and 0 nonzeros
Model fingerprint: 0x4a92feec
Coefficient statistics:
  Matrix range     [0e+

       0    9.2018138e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  9.201813841e+03
Elapsed: 00:00:00
affected_items [  82   97  926 1898 2412 2517 2729 3097 3593 4443 4606 4848 5098 5852
 6059 6353 6498 7010 7205 7213]
82
unaffected_items [ 300  395  484  528 1172 1202 1363 1447 1710 1980 2195 2845 3286 3558
 4651 4966 5456 6348 6800 6992]
300
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 9 columns and 0 nonzeros
Model fingerprint: 0x48e0c84a
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+02, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 9 columns
Presolve time: 0.01s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.0154500e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.015450027

Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 18 columns and 0 nonzeros
Model fingerprint: 0x798d0129
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [4e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 18 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    1.3953490e+04   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  1.395349021e+04
Elapsed: 00:00:00
affected_items [  97  585  926 2412 2729 2847 4443 4673 4848 5098 5285 5410 5763 5852
 5985 6251 6353 7034 7205 7213]
97
unaffected_items [ 528  626  666 1363 1365 1575 2059 2845 3242 3286 3479 3613 4313 5497
 5603 5802 5878 5911 6618 7243]
528
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 19 columns and 0 nonzeros
Model fingerprint: 0x3

       0    7.2512539e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  7.251253938e+03
Elapsed: 00:00:00
affected_items [  39  201  727  796 1127 1308 1443 1548 2364 3337 3368 3980 4011 4358
 4671 4786 6047 6353 6454 6667]
39
unaffected_items [ 425  646  996 1433 1694 1934 1982 2565 3494 3566 3852 4087 4822 5198
 5266 5287 6017 6157 6802 6845]
425
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 8 columns and 0 nonzeros
Model fingerprint: 0x62abec75
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [1e+01, 5e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 8 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    7.2676483e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  7.267648263

Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 17 columns and 0 nonzeros
Model fingerprint: 0xee04b5e2
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [7e+00, 4e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 17 columns
Presolve time: 0.01s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    9.1443146e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  9.144314592e+03
Elapsed: 00:00:00
affected_items [  39  201  727  796 1443 1548 2364 3337 3739 3980 4358 4599 4671 4786
 5340 5840 6047 6353 6454 6667]
39
unaffected_items [ 928  996 1184 1433 1442 1600 1980 1982 2736 3390 3494 5531 5603 5911
 6130 6618 6778 6824 7184 7451]
928
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 18 columns and 0 nonzeros
Model fingerprint: 0x5

Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    6.9524967e+03   0.000000e+00   0.000000e+00      0s

Solved in 0 iterations and 0.01 seconds
Optimal objective  6.952496740e+03
Elapsed: 00:00:00
affected_items [  82  585 1090 1709 1898 2412 2517 2804 3204 3593 4443 4606 5725 5763
 6059 6299 6353 6498 7010 7034]
82
unaffected_items [ 395  554  822 1172 1710 1980 2315 2433 2693 2845 3286 4369 5310 5469
 5610 5853 6472 6778 6789 6800]
395
Gurobi Optimizer version 9.0.1 build v9.0.1rc0 (mac64)
Optimize a model with 0 rows, 7 columns and 0 nonzeros
Model fingerprint: 0x454956ee
Coefficient statistics:
  Matrix range     [0e+00, 0e+00]
  Objective range  [5e+01, 3e+03]
  Bounds range     [1e+00, 1e+00]
  RHS range        [0e+00, 0e+00]
Presolve removed 0 rows and 7 columns
Presolve time: 0.00s
Presolve: All rows and columns removed
Iteration    Objective       Primal Inf.    Dual Inf.      Time
       0    7.9600997e+03   0.000000e+00   0.000000e+00      0s

Solved

KeyboardInterrupt: 

# Tune lambda

In [59]:
lambs = [0.01,0.1,1,10,30,50,70,90,100,1000]
for lamb in lambs:
    row = {}
    matrix_Train = rtrain
    matrix_Test = rtest
    test_users = np.arange(25)
#         test_users = [1]
    target_ranks = [20, 50]
    num_items_sampled = 5
    num_keyphrases = 235
    df = pd.DataFrame(row)
    max_iteration_threshold = 20
    keyphrase_popularity = keyphrase_popularity
    dataset_name = "yelp"
    model = "plrec"
    parameters_row = {'iter': 10,
                      'lambda':200,
                      'rank':200}
    keyphrases_names = keyphrases
    keyphrase_selection_method = 'random'
    max_wanted_keyphrase = 20
    critiquing_model = LP1Simplified(keyphrase_freq=U_K,
                                    item_keyphrase_freq=I_K,
                                    row=row,
                                    matrix_Train=matrix_Train,
                                    matrix_Test=matrix_Test,
                                    test_users=test_users,
                                    target_ranks=target_ranks,
                                    num_items_sampled=num_items_sampled,
                                    num_keyphrases=num_keyphrases,
                                    df=df,
                                    max_iteration_threshold=max_iteration_threshold,
                                    keyphrase_popularity=keyphrase_popularity,
                                    dataset_name=dataset_name,
                                    model=model,
                                    parameters_row=parameters_row,
                                    keyphrases_names = keyphrases_names,
                                    keyphrase_selection_method = keyphrase_selection_method,
                                    max_wanted_keyphrase = max_wanted_keyphrase,
                                    lamb = lamb)
    df = critiquing_model.start_critiquing()

    table_path = '../tables/critiquing/tuning_ranksvm3/'
    name = 'lamb_'+ str(lamb) + '_test.csv'
    save_dataframe_csv(df, table_path, name)

  4%|▍         | 1/25 [00:06<02:46,  6.96s/it]

User  0 Elapsed: 00:00:06


  8%|▊         | 2/25 [00:37<05:24, 14.12s/it]

User  1 Elapsed: 00:00:30


 12%|█▏        | 3/25 [00:46<04:35, 12.51s/it]

User  2 Elapsed: 00:00:08


 16%|█▌        | 4/25 [00:55<03:57, 11.30s/it]

User  3 Elapsed: 00:00:08


 20%|██        | 5/25 [00:59<03:08,  9.40s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:05<02:38,  8.32s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:11<02:13,  7.40s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:15<01:49,  6.45s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:21<01:42,  6.40s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:29<01:43,  6.88s/it]

User  9 Elapsed: 00:00:07


 44%|████▍     | 11/25 [01:38<01:47,  7.65s/it]

User  10 Elapsed: 00:00:09


 48%|████▊     | 12/25 [01:48<01:46,  8.18s/it]

User  11 Elapsed: 00:00:09


 52%|█████▏    | 13/25 [01:56<01:36,  8.08s/it]

User  12 Elapsed: 00:00:07


 56%|█████▌    | 14/25 [02:07<01:38,  8.95s/it]

User  13 Elapsed: 00:00:10


 60%|██████    | 15/25 [02:15<01:26,  8.64s/it]

User  14 Elapsed: 00:00:07
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:31<01:07,  8.44s/it]

User  16 Elapsed: 00:00:15


 72%|███████▏  | 18/25 [02:51<01:23, 11.96s/it]

User  17 Elapsed: 00:00:20


 76%|███████▌  | 19/25 [03:01<01:07, 11.30s/it]

User  18 Elapsed: 00:00:09


 80%|████████  | 20/25 [03:17<01:04, 12.99s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:29<00:50, 12.53s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:39<00:35, 11.92s/it]

User  21 Elapsed: 00:00:10


 92%|█████████▏| 23/25 [03:44<00:19,  9.68s/it]

User  22 Elapsed: 00:00:04
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:48<00:00,  9.15s/it]
  0%|          | 0/25 [00:00<?, ?it/s]

User  24 Elapsed: 00:00:04


  4%|▍         | 1/25 [00:07<02:56,  7.34s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:40<05:47, 15.12s/it]

User  1 Elapsed: 00:00:33


 12%|█▏        | 3/25 [00:48<04:45, 12.95s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:56<04:00, 11.45s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [01:01<03:10,  9.50s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:07<02:41,  8.48s/it]

User  5 Elapsed: 00:00:06


 28%|██▊       | 7/25 [01:13<02:16,  7.58s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:17<01:54,  6.73s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:24<01:48,  6.76s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:33<01:49,  7.28s/it]

User  9 Elapsed: 00:00:08


 44%|████▍     | 11/25 [01:42<01:50,  7.92s/it]

User  10 Elapsed: 00:00:09


 48%|████▊     | 12/25 [01:53<01:53,  8.71s/it]

User  11 Elapsed: 00:00:10


 52%|█████▏    | 13/25 [02:01<01:42,  8.54s/it]

User  12 Elapsed: 00:00:08


 56%|█████▌    | 14/25 [02:11<01:39,  9.05s/it]

User  13 Elapsed: 00:00:10


 60%|██████    | 15/25 [02:18<01:24,  8.47s/it]

User  14 Elapsed: 00:00:07
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:34<01:06,  8.37s/it]

User  16 Elapsed: 00:00:16


 72%|███████▏  | 18/25 [02:56<01:25, 12.27s/it]

User  17 Elapsed: 00:00:21


 76%|███████▌  | 19/25 [03:06<01:09, 11.60s/it]

User  18 Elapsed: 00:00:10


 80%|████████  | 20/25 [03:23<01:06, 13.24s/it]

User  19 Elapsed: 00:00:17


 84%|████████▍ | 21/25 [03:34<00:50, 12.68s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:45<00:36, 12.00s/it]

User  21 Elapsed: 00:00:10


 92%|█████████▏| 23/25 [03:50<00:19,  9.98s/it]

User  22 Elapsed: 00:00:05
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:54<00:00,  9.39s/it]
  0%|          | 0/25 [00:00<?, ?it/s]

User  24 Elapsed: 00:00:04


  4%|▍         | 1/25 [00:07<02:55,  7.33s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:41<05:55, 15.45s/it]

User  1 Elapsed: 00:00:34


 12%|█▏        | 3/25 [00:49<04:48, 13.12s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:57<04:04, 11.64s/it]

User  3 Elapsed: 00:00:08


 20%|██        | 5/25 [01:02<03:09,  9.47s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:08<02:40,  8.44s/it]

User  5 Elapsed: 00:00:06


 28%|██▊       | 7/25 [01:13<02:15,  7.53s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:18<01:54,  6.72s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:25<01:47,  6.72s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:33<01:49,  7.27s/it]

User  9 Elapsed: 00:00:08


 44%|████▍     | 11/25 [01:43<01:53,  8.12s/it]

User  10 Elapsed: 00:00:10


 48%|████▊     | 12/25 [01:53<01:54,  8.77s/it]

User  11 Elapsed: 00:00:10


 52%|█████▏    | 13/25 [02:01<01:40,  8.36s/it]

User  12 Elapsed: 00:00:07


 56%|█████▌    | 14/25 [02:12<01:40,  9.12s/it]

User  13 Elapsed: 00:00:10


 60%|██████    | 15/25 [02:20<01:29,  8.92s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:36<01:09,  8.66s/it]

User  16 Elapsed: 00:00:16


 72%|███████▏  | 18/25 [02:57<01:26, 12.31s/it]

User  17 Elapsed: 00:00:20


 76%|███████▌  | 19/25 [03:07<01:10, 11.67s/it]

User  18 Elapsed: 00:00:10


 80%|████████  | 20/25 [03:24<01:06, 13.25s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:36<00:50, 12.73s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:46<00:36, 12.01s/it]

User  21 Elapsed: 00:00:10


 92%|█████████▏| 23/25 [03:51<00:19,  9.91s/it]

User  22 Elapsed: 00:00:05
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:56<00:00,  9.45s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:55,  7.29s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:41<05:54, 15.43s/it]

User  1 Elapsed: 00:00:34


 12%|█▏        | 3/25 [00:49<04:48, 13.11s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:57<04:02, 11.53s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [01:01<03:07,  9.39s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:07<02:41,  8.48s/it]

User  5 Elapsed: 00:00:06


 28%|██▊       | 7/25 [01:13<02:16,  7.57s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:18<01:56,  6.85s/it]

User  7 Elapsed: 00:00:05


 36%|███▌      | 9/25 [01:25<01:48,  6.76s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:32<01:44,  6.99s/it]

User  9 Elapsed: 00:00:07


 44%|████▍     | 11/25 [01:41<01:47,  7.68s/it]

User  10 Elapsed: 00:00:09


 48%|████▊     | 12/25 [01:52<01:51,  8.55s/it]

User  11 Elapsed: 00:00:10


 52%|█████▏    | 13/25 [02:01<01:42,  8.55s/it]

User  12 Elapsed: 00:00:08


 56%|█████▌    | 14/25 [02:11<01:40,  9.15s/it]

User  13 Elapsed: 00:00:10


 60%|██████    | 15/25 [02:20<01:29,  8.97s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:36<01:10,  8.78s/it]

User  16 Elapsed: 00:00:16


 72%|███████▏  | 18/25 [02:57<01:27, 12.45s/it]

User  17 Elapsed: 00:00:21


 76%|███████▌  | 19/25 [03:06<01:08, 11.38s/it]

User  18 Elapsed: 00:00:08


 80%|████████  | 20/25 [03:24<01:05, 13.17s/it]

User  19 Elapsed: 00:00:17


 84%|████████▍ | 21/25 [03:35<00:50, 12.71s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:46<00:36, 12.17s/it]

User  21 Elapsed: 00:00:10


 92%|█████████▏| 23/25 [03:51<00:19,  9.90s/it]

User  22 Elapsed: 00:00:04
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:55<00:00,  9.44s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:51,  7.14s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:41<05:54, 15.41s/it]

User  1 Elapsed: 00:00:34


 12%|█▏        | 3/25 [00:50<04:53, 13.32s/it]

User  2 Elapsed: 00:00:08


 16%|█▌        | 4/25 [00:58<04:07, 11.79s/it]

User  3 Elapsed: 00:00:08


 20%|██        | 5/25 [01:03<03:12,  9.64s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:08<02:40,  8.46s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:14<02:15,  7.52s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:18<01:53,  6.70s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:25<01:48,  6.79s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:34<01:49,  7.33s/it]

User  9 Elapsed: 00:00:08


 44%|████▍     | 11/25 [01:45<01:58,  8.47s/it]

User  10 Elapsed: 00:00:11


 48%|████▊     | 12/25 [01:56<01:57,  9.03s/it]

User  11 Elapsed: 00:00:10


 52%|█████▏    | 13/25 [02:04<01:45,  8.81s/it]

User  12 Elapsed: 00:00:08


 56%|█████▌    | 14/25 [02:15<01:45,  9.64s/it]

User  13 Elapsed: 00:00:11


 60%|██████    | 15/25 [02:24<01:32,  9.24s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:41<01:12,  9.07s/it]

User  16 Elapsed: 00:00:17


 72%|███████▏  | 18/25 [03:01<01:25, 12.27s/it]

User  17 Elapsed: 00:00:19


 76%|███████▌  | 19/25 [03:10<01:07, 11.27s/it]

User  18 Elapsed: 00:00:08


 80%|████████  | 20/25 [03:26<01:03, 12.77s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:38<00:50, 12.52s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:47<00:34, 11.64s/it]

User  21 Elapsed: 00:00:09


 92%|█████████▏| 23/25 [03:52<00:19,  9.57s/it]

User  22 Elapsed: 00:00:04
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:57<00:00,  9.50s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:48,  7.01s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:42<05:55, 15.44s/it]

User  1 Elapsed: 00:00:35


 12%|█▏        | 3/25 [00:49<04:46, 13.03s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:57<04:00, 11.44s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [01:01<03:04,  9.22s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:06<02:33,  8.06s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:12<02:10,  7.26s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:16<01:49,  6.45s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:23<01:43,  6.50s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:31<01:44,  6.97s/it]

User  9 Elapsed: 00:00:08


 44%|████▍     | 11/25 [01:41<01:51,  8.00s/it]

User  10 Elapsed: 00:00:10


 48%|████▊     | 12/25 [01:50<01:47,  8.23s/it]

User  11 Elapsed: 00:00:08


 52%|█████▏    | 13/25 [01:58<01:39,  8.29s/it]

User  12 Elapsed: 00:00:08


 56%|█████▌    | 14/25 [02:09<01:37,  8.91s/it]

User  13 Elapsed: 00:00:10


 60%|██████    | 15/25 [02:17<01:27,  8.79s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:33<01:07,  8.50s/it]

User  16 Elapsed: 00:00:15


 72%|███████▏  | 18/25 [02:53<01:23, 11.92s/it]

User  17 Elapsed: 00:00:19


 76%|███████▌  | 19/25 [03:02<01:06, 11.13s/it]

User  18 Elapsed: 00:00:09


 80%|████████  | 20/25 [03:19<01:04, 12.82s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:30<00:49, 12.36s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:39<00:34, 11.41s/it]

User  21 Elapsed: 00:00:09


 92%|█████████▏| 23/25 [03:45<00:19,  9.57s/it]

User  22 Elapsed: 00:00:05
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:49<00:00,  9.19s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:52,  7.20s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:38<05:34, 14.56s/it]

User  1 Elapsed: 00:00:31


 12%|█▏        | 3/25 [00:46<04:35, 12.53s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:53<03:49, 10.95s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [00:58<03:00,  9.02s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:03<02:30,  7.91s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:08<02:02,  6.80s/it]

User  6 Elapsed: 00:00:04


 32%|███▏      | 8/25 [01:12<01:44,  6.12s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:18<01:38,  6.14s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:26<01:37,  6.52s/it]

User  9 Elapsed: 00:00:07


 44%|████▍     | 11/25 [01:36<01:47,  7.71s/it]

User  10 Elapsed: 00:00:10


 48%|████▊     | 12/25 [01:46<01:48,  8.37s/it]

User  11 Elapsed: 00:00:09


 52%|█████▏    | 13/25 [01:54<01:40,  8.35s/it]

User  12 Elapsed: 00:00:08


 56%|█████▌    | 14/25 [02:04<01:35,  8.69s/it]

User  13 Elapsed: 00:00:09


 60%|██████    | 15/25 [02:12<01:24,  8.50s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:28<01:06,  8.34s/it]

User  16 Elapsed: 00:00:15


 72%|███████▏  | 18/25 [02:48<01:22, 11.74s/it]

User  17 Elapsed: 00:00:19


 76%|███████▌  | 19/25 [02:57<01:05, 10.95s/it]

User  18 Elapsed: 00:00:09


 80%|████████  | 20/25 [03:12<01:01, 12.38s/it]

User  19 Elapsed: 00:00:15


 84%|████████▍ | 21/25 [03:24<00:48, 12.02s/it]

User  20 Elapsed: 00:00:11


 88%|████████▊ | 22/25 [03:35<00:35, 11.76s/it]

User  21 Elapsed: 00:00:11


 92%|█████████▏| 23/25 [03:40<00:19,  9.96s/it]

User  22 Elapsed: 00:00:05
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:45<00:00,  9.03s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:58,  7.44s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:40<05:50, 15.23s/it]

User  1 Elapsed: 00:00:33


 12%|█▏        | 3/25 [00:48<04:46, 13.03s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:56<03:58, 11.34s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [01:00<03:06,  9.32s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:06<02:36,  8.25s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:11<02:12,  7.34s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:16<01:49,  6.47s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:22<01:42,  6.41s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:29<01:40,  6.68s/it]

User  9 Elapsed: 00:00:07


 44%|████▍     | 11/25 [01:39<01:45,  7.51s/it]

User  10 Elapsed: 00:00:09


 48%|████▊     | 12/25 [01:48<01:46,  8.16s/it]

User  11 Elapsed: 00:00:09


 52%|█████▏    | 13/25 [01:56<01:36,  8.04s/it]

User  12 Elapsed: 00:00:07


 56%|█████▌    | 14/25 [02:08<01:40,  9.14s/it]

User  13 Elapsed: 00:00:11


 60%|██████    | 15/25 [02:16<01:29,  8.99s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:32<01:09,  8.68s/it]

User  16 Elapsed: 00:00:15


 72%|███████▏  | 18/25 [02:53<01:26, 12.35s/it]

User  17 Elapsed: 00:00:20


 76%|███████▌  | 19/25 [03:02<01:06, 11.14s/it]

User  18 Elapsed: 00:00:08


 80%|████████  | 20/25 [03:18<01:03, 12.62s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:28<00:48, 12.07s/it]

User  20 Elapsed: 00:00:10


 88%|████████▊ | 22/25 [03:39<00:34, 11.56s/it]

User  21 Elapsed: 00:00:10


 92%|█████████▏| 23/25 [03:44<00:19,  9.61s/it]

User  22 Elapsed: 00:00:05
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:48<00:00,  9.15s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:50,  7.09s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:39<05:37, 14.68s/it]

User  1 Elapsed: 00:00:32


 12%|█▏        | 3/25 [00:47<04:37, 12.60s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:54<03:53, 11.14s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [00:58<03:00,  9.00s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:04<02:32,  8.01s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:09<02:04,  6.93s/it]

User  6 Elapsed: 00:00:04


 32%|███▏      | 8/25 [01:13<01:45,  6.19s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:19<01:39,  6.20s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:27<01:39,  6.65s/it]

User  9 Elapsed: 00:00:07


 44%|████▍     | 11/25 [01:36<01:43,  7.42s/it]

User  10 Elapsed: 00:00:09


 48%|████▊     | 12/25 [01:46<01:44,  8.03s/it]

User  11 Elapsed: 00:00:09


 52%|█████▏    | 13/25 [01:53<01:32,  7.69s/it]

User  12 Elapsed: 00:00:06


 56%|█████▌    | 14/25 [02:03<01:32,  8.45s/it]

User  13 Elapsed: 00:00:10


 60%|██████    | 15/25 [02:11<01:23,  8.36s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:27<01:05,  8.23s/it]

User  16 Elapsed: 00:00:15


 72%|███████▏  | 18/25 [02:46<01:20, 11.47s/it]

User  17 Elapsed: 00:00:19


 76%|███████▌  | 19/25 [02:54<01:03, 10.53s/it]

User  18 Elapsed: 00:00:08


 80%|████████  | 20/25 [03:10<01:00, 12.20s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:21<00:47, 11.78s/it]

User  20 Elapsed: 00:00:10


 88%|████████▊ | 22/25 [03:31<00:33, 11.28s/it]

User  21 Elapsed: 00:00:10


 92%|█████████▏| 23/25 [03:37<00:19,  9.53s/it]

User  22 Elapsed: 00:00:05
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:41<00:00,  8.85s/it]

User  24 Elapsed: 00:00:04



  4%|▍         | 1/25 [00:07<02:50,  7.10s/it]

User  0 Elapsed: 00:00:07


  8%|▊         | 2/25 [00:38<05:32, 14.48s/it]

User  1 Elapsed: 00:00:31


 12%|█▏        | 3/25 [00:46<04:31, 12.35s/it]

User  2 Elapsed: 00:00:07


 16%|█▌        | 4/25 [00:53<03:49, 10.93s/it]

User  3 Elapsed: 00:00:07


 20%|██        | 5/25 [00:58<02:58,  8.93s/it]

User  4 Elapsed: 00:00:04


 24%|██▍       | 6/25 [01:03<02:32,  8.02s/it]

User  5 Elapsed: 00:00:05


 28%|██▊       | 7/25 [01:08<02:08,  7.13s/it]

User  6 Elapsed: 00:00:05


 32%|███▏      | 8/25 [01:13<01:46,  6.29s/it]

User  7 Elapsed: 00:00:04


 36%|███▌      | 9/25 [01:19<01:40,  6.30s/it]

User  8 Elapsed: 00:00:06


 40%|████      | 10/25 [01:27<01:39,  6.64s/it]

User  9 Elapsed: 00:00:07


 44%|████▍     | 11/25 [01:36<01:45,  7.52s/it]

User  10 Elapsed: 00:00:09


 48%|████▊     | 12/25 [01:45<01:44,  8.01s/it]

User  11 Elapsed: 00:00:09


 52%|█████▏    | 13/25 [01:53<01:33,  7.81s/it]

User  12 Elapsed: 00:00:07


 56%|█████▌    | 14/25 [02:04<01:37,  8.86s/it]

User  13 Elapsed: 00:00:11


 60%|██████    | 15/25 [02:13<01:28,  8.81s/it]

User  14 Elapsed: 00:00:08
User  15 Elapsed: 00:00:00


 68%|██████▊   | 17/25 [02:28<01:08,  8.50s/it]

User  16 Elapsed: 00:00:15


 72%|███████▏  | 18/25 [02:47<01:22, 11.72s/it]

User  17 Elapsed: 00:00:19


 76%|███████▌  | 19/25 [02:56<01:05, 10.90s/it]

User  18 Elapsed: 00:00:08


 80%|████████  | 20/25 [03:13<01:02, 12.54s/it]

User  19 Elapsed: 00:00:16


 84%|████████▍ | 21/25 [03:24<00:48, 12.08s/it]

User  20 Elapsed: 00:00:10


 88%|████████▊ | 22/25 [03:33<00:33, 11.26s/it]

User  21 Elapsed: 00:00:09


 92%|█████████▏| 23/25 [03:37<00:18,  9.09s/it]

User  22 Elapsed: 00:00:04
User  23 Elapsed: 00:00:00


100%|██████████| 25/25 [03:41<00:00,  8.88s/it]

User  24 Elapsed: 00:00:04





In [206]:
table_path = '../tables/critiquing/multi_step_critiquing/yelp/ranksvm/'
name = 'ranksvm2test.csv'
# save_dataframe_csv(df, table_path, name)
df = load_dataframe_csv(table_path,name)

In [243]:
def avg_successful_rate(df):
    num_runs = len(np.where(df['iteration'] == 0)[0])
    num_success = len(np.where(df['result'] == 'successful')[0])
    
    return num_success/num_runs
def avg_length(df,include_fail = True):
    num_runs = len(np.where(df['iteration'] == 0)[0])
    return (len(df)-num_runs)/num_runs

In [267]:
# df_5 =  df[df['target_rank'] == 5]
# df_10 = df[df['target_rank'] == 10]
df_20 = df[df['target_rank'] == 20]
df_50 = df[df['target_rank'] == 50]

In [245]:
# Ranksvm 1 50 users 20 topaffected lamb = 5
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

18.271084337349397
0.10090361445783133
16.94277108433735
0.1822289156626506


In [239]:
# Ranksvm2 50 users 20topaffected lamb = 5
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

18.370481927710845
0.09789156626506024
17.049698795180724
0.17620481927710843


In [268]:
# Ranksvm2 50 users 20topaffected lamb = 100, range = -100to100
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

18.13102409638554
0.11897590361445783
16.673192771084338
0.21234939759036145


In [252]:
# Avg
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

16.003012048192772
0.2756024096385542
14.045180722891565
0.39457831325301207


In [219]:
# Ranksvm 2 bot 20 affected
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

20.0
0.0
19.08888888888889
0.06666666666666667


In [290]:
# Rating obj
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

19.377777777777776
0.08888888888888889
18.88888888888889
0.15555555555555556


In [258]:
# top20items
print (avg_length(df_20))
print (avg_successful_rate(df_20))
print (avg_length(df_50))
print (avg_successful_rate(df_50))

18.466666666666665
0.15555555555555556
17.177777777777777
0.26666666666666666
