In [1]:
%load_ext autoreload
%autoreload 2

In [2]:
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np
import os
from pulp import *
from copy import deepcopy
# Move up one directory at a time until the current working directory path no
# longer contains "notebooks". Presumably this lands on the project root so
# that the `src.*` imports and relative data paths resolve -- confirm against
# the repository layout.
while "notebooks" in os.getcwd():
    os.chdir("..")

from src.preprocessing.parser import Parser
from src.preprocessing.preprocessor import Preprocessor
from src.solvers.solution import Solution
from src.solvers.greedy import GreedySolver
from src.solvers.pulp_solver import PuLPSolver
from src.solvers.dp import DPSolver
from src.solvers.base_solver import DPMethods

from time import time
from tqdm import tqdm
from typing import Dict

Pyarrow will become a required dependency of pandas in the next major release of pandas (pandas 3.0),
(to allow more performant data types, such as the Arrow string type, and better interoperability with other libraries)
but was not found to be installed on your system.
If this would cause problems for you,
please provide us feedback at https://github.com/pandas-dev/pandas/issues/54466
        
  import pandas as pd


In [3]:
def get_num_triples(dataset : Dict):
    """Return the total number of entries held in ``dataset``.

    The count is the sum of ``len(value)`` over every value stored in the
    mapping; an empty mapping yields 0.

    Args:
        dataset: Mapping whose values all support ``len()``.

    Returns:
        The summed length of all values.
    """
    return sum(len(entries) for entries in dataset.values())

## Test 05

In [4]:
# Build the parser for the test-5 instance file; the path is relative to the
# current working directory.
parser = Parser("data/testfiles/test5.txt")

In [5]:
# Read the instance file and report how long the read took (wall clock).
read_start = time()
info = parser.read()
read_elapsed = time() - read_start

print(f"Total execution time {read_elapsed} s")

1204it [00:00, 118445.93it/s]


Total execution time 0.23374509811401367 s


In [6]:
# Pull the parsed fields out of `info` into the names used by the cells below.
dataset: Dict[int, pd.DataFrame] = info['data']
p, K, M, N = (info[field] for field in ('p', 'K', 'M', 'N'))

In [7]:
# Run the three preprocessing stages in sequence. For each stage, record the
# wall-clock runtime and the number of triples left afterwards (as counted by
# get_num_triples) under the stage's name in `preprocessing_results`.
preprocessing_results = {}
preprocessor = Preprocessor(
    K, 
    M,
    N,
    p,
    dataset
)

# Stage 1: remove trivial values (operates on the data given to the constructor).
t0 = time()
data_1 = preprocessor.remove_trivial_values()
t1 = time()

preprocessing_results['remove trivial values'] = {
    "runtime": (t1 - t0),
    "num_triples": get_num_triples(data_1)
}

# Stage 2: remove IP-dominated entries.
# The clock is restarted so the bookkeeping above is not charged to this stage.
# The stage is fed the output of stage 1 (`data_1`) rather than the raw
# `dataset`, so the stages are chained the same way stage 3 consumes `data_2`.
t1 = time()
data_2 = preprocessor.remove_ip_dominated(data_1)
t2 = time()
preprocessing_results['remove IP dominated'] = {
    "runtime": t2-t1,
    "num_triples": get_num_triples(data_2)
}

# Stage 3: remove LP-dominated entries from the stage-2 output.
t2 = time()
data_3 = preprocessor.remove_lp_dominated(data_2)
t3 = time()
preprocessing_results['remove LP dominated'] = {
    "runtime": t3-t2,
    "num_triples": get_num_triples(data_3)
}


100%|██████████| 40/40 [00:00<00:00, 7141.37it/s]


100%|██████████| 40/40 [00:00<00:00, 40.40it/s]
100%|██████████| 40/40 [00:00<00:00, 354.99it/s]


In [8]:
# Tabulate the per-stage results: one column per preprocessing stage, with
# rows "runtime" and "num_triples".
pd.DataFrame(preprocessing_results)

Unnamed: 0,remove trivial values,remove IP dominated,remove LP dominated
runtime,0.440886,0.995682,0.410841
num_triples,1954.0,329.0,193.0


## Solutions to the LP (PuLP and greedy algorithm)

In [9]:
# Collects, per solver name, a dict with that solver's 'runtime' and 'data_rate'.
lp_results = {}

In [10]:
# Solve the instance with the PuLP-based solver on the fully preprocessed data
# (`data_3`) and store its wall-clock runtime and objective value.
pulp_solver = PuLPSolver(K, M, N, p, data_3)

pulp_start = time()
pulp_solver.solve()
pulp_elapsed = time() - pulp_start

pulp_entry = {}
pulp_entry['runtime'] = pulp_elapsed
pulp_entry['data_rate'] = pulp_solver.solution.objective.value()
lp_results['pulp'] = pulp_entry

Welcome to the CBC MILP Solver 
Version: 2.10.3 
Build Date: Dec 15 2019 

command line - /home/pedro/anaconda3/envs/user-scheduling-in-5g/lib/python3.12/site-packages/pulp/solverdir/cbc/linux/64/cbc /tmp/6f1618cbee68414b910bd23f7de00ea5-pulp.mps -max -timeMode elapsed -branch -printingOptions all -solution /tmp/6f1618cbee68414b910bd23f7de00ea5-pulp.sol (default strategy 1)
At line 2 NAME          MODEL
At line 3 ROWS
At line 46 COLUMNS
At line 626 RHS
At line 668 BOUNDS
At line 862 ENDATA
Problem MODEL has 41 rows, 193 columns and 386 elements
Coin0008I MODEL read with 0 errors
Option for timeMode changed from cpu to elapsed
Presolve 41 (0) rows, 193 (0) columns and 386 (0) elements
0  Obj -0 Primal inf 63.67607 (40) Dual inf 12876.888 (193)
30  Obj 1637
Optimal - objective value 1637
Optimal objective 1637 - 30 iterations time 0.002
Option for printingOptions changed from normal to all
Total time (CPU seconds):       0.00   (Wallclock seconds):       0.00



In [11]:
# Solve the same preprocessed instance with the greedy solver and store its
# wall-clock runtime and the data rate reported by its solution.
solver = GreedySolver(K, M, N, p, data_3)

greedy_start = time()
solver.solve(data_3)
greedy_elapsed = time() - greedy_start

greedy_entry = {}
greedy_entry['runtime'] = greedy_elapsed
greedy_entry['data_rate'] = solver.solution.get_data_rate()
lp_results['greedy'] = greedy_entry


In [12]:
# Side-by-side comparison of the two solvers: one column per solver, with rows
# "runtime" and "data_rate".
pd.DataFrame(lp_results)

Unnamed: 0,pulp,greedy
runtime,0.011698,0.151701
data_rate,1637.0,1637.0


## Solutions to the ILP

In [13]:
# Collects, per DP method name, a dict with that run's 'runtime' and 'data_rate'.
ilp_results = {}

In [14]:
# Solve the instance with the dynamic-programming solver using both DP methods
# (MAXIMIZE_R, then MINIMIZE_P) on the preprocessed data `data_3`, recording
# wall-clock runtime and resulting data rate for each.
dp_solver = DPSolver(
    K, 
    M,
    N,
    p,
    data_3
)

t1 = time()
dp_solver.solve(
    None,
    method = DPMethods.MAXIMIZE_R
)
t2 = time()
ilp_results['DP_maximize_r'] = {
    'runtime' : t2 - t1,
    "data_rate" : dp_solver.solution.get_data_rate()
}

# The PuLP objective value supplies the bound U for the MINIMIZE_P run. This
# solve is deliberately kept outside the timed region below.
# NOTE(review): presumably U is an upper bound on the achievable data rate --
# confirm against DPSolver.
pulp_solver.solve()
# Round up instead of truncating: int() alone would turn a float such as
# 1636.9999999 into 1636, i.e. a bound below the LP optimum. For an exactly
# integral objective the result is unchanged.
U = int(np.ceil(pulp_solver.solution.objective.value()))

t1 = time()
dp_solver.solve(
    None,
    method = DPMethods.MINIMIZE_P,
    U = U
)
t2 = time()

ilp_results['DP_minimize_p'] = {
    'runtime' : t2 - t1,
    "data_rate" : dp_solver.solution.get_data_rate()
}

Welcome to the CBC MILP Solver 
Version: 2.10.3 
Build Date: Dec 15 2019 

command line - /home/pedro/anaconda3/envs/user-scheduling-in-5g/lib/python3.12/site-packages/pulp/solverdir/cbc/linux/64/cbc /tmp/1ed826a5cf77459ebdafa4fa5d6a9817-pulp.mps -max -timeMode elapsed -branch -printingOptions all -solution /tmp/1ed826a5cf77459ebdafa4fa5d6a9817-pulp.sol (default strategy 1)
At line 2 NAME          MODEL
At line 3 ROWS
At line 46 COLUMNS
At line 626 RHS
At line 668 BOUNDS
At line 862 ENDATA
Problem MODEL has 41 rows, 193 columns and 386 elements
Coin0008I MODEL read with 0 errors
Option for timeMode changed from cpu to elapsed
Presolve 41 (0) rows, 193 (0) columns and 386 (0) elements
0  Obj -0 Primal inf 63.67607 (40) Dual inf 12876.888 (193)
30  Obj 1637
Optimal - objective value 1637
Optimal objective 1637 - 30 iterations time 0.002
Option for printingOptions changed from normal to all
Total time (CPU seconds):       0.00   (Wallclock seconds):       0.00



In [15]:
# Side-by-side comparison of the two DP methods: one column per method, with
# rows "runtime" and "data_rate".
pd.DataFrame(ilp_results)

Unnamed: 0,DP_maximize_r,DP_minimize_p
runtime,0.18046,0.23112
data_rate,1637.0,1637.0
