# Toy example of radix-based optimization across multiple conditions

In [1]:
# Notebook-wide switches.
# SCALE_CROWDING: when True, the later "Try scaling" step rescales the crowding bound and coefficients.
SCALE_CROWDING=False
# PREVENT_ZERO: forwarded as `prevent_zero` to opt.to_radix.
PREVENT_ZERO = True

In [2]:
# Load the line_profiler extension (provides the %lprun magic).
%load_ext line_profiler

In [3]:
from gurobipy import *

import seaborn as sns
import pandas as pd
import matplotlib.pyplot as plt
import numpy as np

plt.rcParams['svg.fonttype'] = 'none'
pd.set_option('display.max_colwidth', -1)
%matplotlib inline

from dynamicme.decomposition import Decomposer
from dynamicme.callback_gurobi import cb_benders
from dynamicme.optimize import Optimizer, StackOptimizer
from dynamicme.optimize import Constraint, Variable

from cobra.io import load_json_model
from cobra import Metabolite, Reaction
from six import iteritems

import numpy as np
import cobra

(<type 'exceptions.ImportError'>, ImportError('No module named cplex',), <traceback object at 0x7fadcaf0ef80>)


### Try optimizing using radix for one condition first

In [88]:
#----------------------------------------
# Load the core model and define the initial crowding parameters
ijomc = load_json_model('/home/laurence/ME/models/BiGG_M/json/e_coli_core.json')
mdl_ref = ijomc

# Initial crowding coefficient shared by every crowded reaction.
# NOTE(review): looks like 1 / (65 per second * 3600 s/h) -- confirm units.
keff0 = 1./65/3600
crowding_bound0 = 0.001
crowding_bound = crowding_bound0

# Reactions excluded from the crowding constraint even if fully cytosolic
not_crowded = ['ATPM']


def _is_crowded(reaction):
    """True for non-biomass, non-excluded reactions whose metabolites are all in compartment 'c'."""
    if 'BIOMASS' in reaction.id or reaction.id in not_crowded:
        return False
    return all(met.compartment == 'c' for met in reaction.metabolites)


rxns_c = [r for r in ijomc.reactions if _is_crowded(r)]
crowding_dict = dict((rxn, keff0) for rxn in rxns_c)
#----------------------------------------

# Temporarily add crowding constraint for the duality gap constraint:
#   sum_j keff_j * v_j <= crowding_bound
crowding = Constraint('crowding')
crowding._bound = crowding_bound
crowding._constraint_sense = 'L'
for rxn, keff in iteritems(crowding_dict):
    rxn.add_metabolites({crowding: keff})

In [5]:
# Solve the single-condition model with the crowding constraint attached and
# record the resulting biomass flux as the baseline growth rate.
ijomc.optimize()
mu_crowd0 = ijomc.reactions.BIOMASS_Ecoli_core_w_GAM.x
print(mu_crowd0)

0.873921506968


In [98]:
# Number of growth conditions (substrates) to stack.
# This must be defined here: the slice conds[0:N_CONDS] at the end of this cell
# raises NameError on a fresh kernel when the assignment is commented out.
N_CONDS = 2

# Measured growth rates, one row per substrate, with the matching exchange reaction ID.
df_meas = pd.read_csv('/home/laurence/ME/data/dynamicME/beg/growth_meas.csv')
# Keep only measurements whose exchange reaction exists in the reference model.
ex_rxns = [r for r in df_meas.ex_rxn.unique() if mdl_ref.reactions.has_id(r)]
df_meas = df_meas[ df_meas.ex_rxn.isin(ex_rxns)]
conds = df_meas.substrate.unique()
# One row per (condition, exchange reaction): the condition's own substrate gets
# lb=-10 (uptake allowed); every other measured substrate gets lb=0 (uptake closed).
df_conds = pd.DataFrame([{'cond':r['substrate'], 'rxn':ex_rxn, 'lb':-10 if r['ex_rxn']==ex_rxn else 0, 'ub':1000., 'obj':0.} for i,r in df_meas.iterrows() for ex_rxn in ex_rxns])
# Restrict to the first N_CONDS conditions.
df_conds = df_conds[ df_conds.cond.isin(conds[0:N_CONDS])]

In [7]:
# Build one stacked model from the reference model and the per-condition bounds table.
stacker = StackOptimizer()
stacker.stack_models(ijomc, df_conds)

In [8]:
# Solve the stacked (all-conditions) model with Gurobi.
stacker.model.optimize(solver='gurobi')

<Solution 1.75 at 0x7fad6ac87c90>

In [9]:
# Solve the fructose sub-model on its own.
stacker.model_dict['fructose'].optimize()

<Solution 0.87 at 0x7fad6ac87990>

In [10]:
# Solve the glucose sub-model and show its biomass flux and the two sugar exchange fluxes.
glc_mdl = stacker.model_dict['glucose']
glc_mdl.optimize()
for rxn_prefix in ('BIOMASS', 'EX_glc', 'EX_fru'):
    print(glc_mdl.reactions.query(rxn_prefix)[0].x)

0.873921506968
-10.0
0.0


In [11]:
# Solve the fructose sub-model and show its biomass flux and the two sugar exchange fluxes.
fru_mdl = stacker.model_dict['fructose']
fru_mdl.optimize()
for rxn_prefix in ('BIOMASS', 'EX_glc', 'EX_fru'):
    print(fru_mdl.reactions.query(rxn_prefix)[0].x)

0.873921506966
0.0
-10.0


In [12]:
# Add a duality-gap constraint to every per-condition sub-model, in place,
# tagging it with the condition index.
# NOTE: `opt` and `gapi` keep only the values from the last iteration; `opt`
# is reused later to call to_radix on the stacked model.
for mdl_ind,mdl in iteritems(stacker.model_dict):
    opt = Optimizer(mdl)
    gapi = opt.add_duality_gap_constraint(INF=1e3, inplace=True, index=mdl_ind)

In [13]:
stacker.model.optimize(solver='gurobi')

<Solution 3.50 at 0x7fae0ce1ce50>

In [14]:
import numpy as np

radix = 2.
print('Radix:',radix)
powers = np.arange(-3,4)
print('Powers:', powers)
# np.linspace needs an integer sample count; newer NumPy rejects a float here.
digits_per_power = int(radix)
pwr_max = max(powers)
# De-duplicate the digits and sort them so each digit has a stable index.
# The binary variables are later looked up by digit index, and plain set()
# iteration order is not guaranteed.
digits = sorted(set(np.linspace(1, radix-1, digits_per_power)))
print('Digits:', digits)

# Discretize crowding coefficients into radix.
# var_cons_dict maps each reference reaction ID (the group) to a list of
# (variable, constraint, coefficient) triples that share one fitted coefficient
# across all conditions.
var_cons_dict = {}
# Get the group ID from reference model
mdl_ref = ijomc
crowding_ref = mdl_ref.metabolites.crowding
for rxn_ref in crowding_ref.reactions:
    for mdl_ind, mdl in iteritems(stacker.model_dict):
        # Condition-specific copies of the crowding constraint, its 'wa_' dual
        # variable, and the primal reaction.
        crowding_p = mdl.metabolites.get_by_id('crowding_%s'%mdl_ind)
        var_d = mdl.reactions.get_by_id('wa_%s'%crowding_p.id)
        rxn_p = mdl.reactions.get_by_id(rxn_ref.id+'_%s'%mdl_ind)
        # Get the coefficient in the dual: constraints of the dual variable
        # that carry the same ID as the primal reaction.
        cons_ds = [m for m in var_d.metabolites.keys() if rxn_p.id==m.id]
        a0 = rxn_p.metabolites[crowding_p]
        # setdefault replaces the Python-2-only dict.has_key branching.
        group = var_cons_dict.setdefault(rxn_ref.id, [])
        group.append((rxn_p, crowding_p, a0))
        group.extend((var_d, cons_d, a0) for cons_d in cons_ds)

('Radix:', 2.0)
('Powers:', array([-3, -2, -1,  0,  1,  2,  3]))
('Digits:', [1.0])




In [15]:
# %lprun -f opt.to_radix opt.to_radix(gap, var_cons_dict, radix, powers, digits_per_power, prevent_zero=True)

In [16]:
# Apply the radix discretization to the stacked model (timed).
# NOTE: `opt` is whichever Optimizer was created last in the duality-gap loop above.
%time opt.to_radix(stacker.model, var_cons_dict, radix, powers, digits=digits, prevent_zero=PREVENT_ZERO)

CPU times: user 210 ms, sys: 22.6 ms, total: 232 ms
Wall time: 213 ms


[1.0]

In [17]:
# Reactions whose 'force_nonzero_<id>' constraint is relaxed by setting its bound to zero
relaxed = ['PGK','GLUDy','PGM','PGI','RPI']
for rel in relaxed:
    cons_id = 'force_nonzero_%s'%rel
    try:
        cons = stacker.model.metabolites.get_by_id(cons_id)
    except KeyError:
        print('Skipping non-existent constraint: %s' % cons_id)
    else:
        cons._bound = 0.

### Try scaling
# Optionally normalise the crowding constraint by its own bound
if SCALE_CROWDING:
    crowding = stacker.model.metabolites.crowding
    bound0 = crowding._bound
    f_scale = bound0
    crowding._bound = bound0 / f_scale
    for rxn in crowding.reactions:
        rxn._metabolites[crowding] /= f_scale

In [18]:
# Objective: weight 1 on every reaction matched by the 'binary' query, weight 0 on everything else.
binary_ids = set(b.id for b in stacker.model.reactions.query('binary'))
for rxn in stacker.model.reactions:
    rxn.objective_coefficient = 1. if rxn.id in binary_ids else 0.

In [27]:
# Gurobi status code of the most recent solve.
# NOTE: `milp` is only created by the tolerance-sweep cell further down, so
# this cell fails with NameError when the notebook is run top to bottom.
milp.Status

11

In [28]:
# Number of solutions found by the most recent solve.
# NOTE: `milp` is only created by the tolerance-sweep cell further down, so
# this cell fails with NameError when the notebook is run top to bottom.
milp.SolCount

0

In [47]:
from cobra.solvers import gurobi_solver
from gurobipy import *

# Schedule of relative growth-rate tolerances for the fit: N_FS evenly spaced
# values going from F_TOL_START (loosest) down to F_TOL_FINAL (tightest).
F_TOL_FINAL = 0.02
F_TOL_START = 1.
N_FS =11
F_TOLS = np.linspace(F_TOL_START, F_TOL_FINAL, N_FS)
F_TOLS

array([1.   , 0.902, 0.804, 0.706, 0.608, 0.51 , 0.412, 0.314, 0.216,
       0.118, 0.02 ])

### TODO: bisection on F_TOL instead of linear

In [None]:
%%time

mu_id = 'BIOMASS_Ecoli_core_w_GAM'
sol_dict = {}
for ind, F_TOL in enumerate(F_TOLS):
    for mdl_ind,mdl in iteritems(stacker.model_dict):
        mu_meas = df_meas[ df_meas.substrate==mdl_ind].growth_rate_1_h.iloc[0]
        rxn_mu = mdl.reactions.get_by_id(mu_id+'_%s'%mdl_ind)    
        rxn_mu.lower_bound = mu_meas*(1-F_TOL)
        rxn_mu.upper_bound = mu_meas*(1+F_TOL)
        mu_crowd0 = np.nan
        print('Condition=%s. Initial mu_crowd=%g. Fitting within %g%% of measured: %g <= mu <= %g' % (mdl_ind, mu_crowd0, 100*F_TOL, rxn_mu.lower_bound, rxn_mu.upper_bound))

    # If feasible solution found, use it as MILP start
    if milp.SolCount > 0:
        print('#'*40)
        print('Setting MIP warm-start values.')
        for v in milp.getVars():
            v.Start = v.X
        sol_dict[ind] = {'x_dict':{v.VarName:v.X for v in milp.getVars()}, 'F_TOL':F_TOL}

    milp = gurobi_solver.create_problem(stacker.model)
    milp.ModelSense = GRB.MINIMIZE
    milp.Params.IntFeasTol = 1e-9
    milp.Params.OutputFlag = 1
    # milp.Params.FeasibilityTol = 1e-9
    # milp.Params.OptimalityTol = 1e-9
    milp.Params.NodefileStart = 3   # Start writing nodes to disk if x GB RAM exceeded (for each thread)
    milp.Params.TimeLimit = 2*3600  # Time limit in seconds

    milp.optimize()

Condition=fructose. Initial mu_crowd=nan. Fitting within 100% of measured: 0 <= mu <= 1.1
Condition=glucose. Initial mu_crowd=nan. Fitting within 100% of measured: 0 <= mu <= 1.48
Changed value of parameter OutputFlag to 1
   Prev: 0  Min: 0  Max: 1  Default: 1
Changed value of parameter NodefileStart to 3.0
   Prev: 1e+100  Min: 0.0  Max: 1e+100  Default: 1e+100
Changed value of parameter TimeLimit to 7200.0
   Prev: 1e+100  Min: 0.0  Max: 1e+100  Default: 1e+100
Optimize a model with 6098 rows, 2396 columns and 16584 nonzeros
Variable types: 2060 continuous, 336 integer (0 binary)
Coefficient statistics:
  Matrix range     [5e-07, 1e+03]
  Objective range  [1e+00, 1e+00]
  Bounds range     [1e+00, 1e+03]
  RHS range        [1e-03, 1e+03]
Presolve removed 1959 rows and 345 columns
Presolve time: 0.03s
Presolved: 4139 rows, 2051 columns, 12258 nonzeros
Variable types: 1715 continuous, 336 integer (336 binary)

Root relaxation: objective 4.300000e+01, 2237 iterations, 0.08 seconds

    

In [52]:
# List each stored solution key together with the tolerance recorded for it.
[(k, s['F_TOL']) for k,s in iteritems(sol_dict)]

[(1, 0.902),
 (2, 0.804),
 (3, 0.706),
 (4, 0.608),
 (5, 0.51),
 (6, 0.4119999999999999),
 (7, 0.31399999999999995),
 (8, 0.21599999999999997),
 (9, 0.118)]

In [54]:
# Number of variable values stored for solution 9; compare with the reaction count in the next cell.
len(sol_dict[9]['x_dict'])

2396

In [55]:
# Number of reactions (columns) in the stacked model.
len(stacker.model.reactions)

2396

In [61]:
# Pick the stored solution with the tightest tolerance.
# len(sol_dict) is only a valid key when the keys happen to be exactly 1..n
# (for example, a re-run that also stores key 0 breaks it), so select by the
# recorded F_TOL instead.
best_ind = min(sol_dict, key=lambda k: sol_dict[k]['F_TOL'])
best_ind

9

In [67]:
# Translate the chosen solution from solver variable names (stringified column
# index) to reaction IDs, and recall the tolerance stored with it.
best_sol = sol_dict[best_ind]
x_by_column = best_sol['x_dict']
x_dict = dict((r.id, x_by_column[str(i)]) for i, r in enumerate(stacker.model.reactions))
F_TOL = best_sol['F_TOL']

In [69]:
# Preview the measured growth rates and their exchange reactions.
df_meas.head()

Unnamed: 0,substrate,growth_rate_1_h,order,ex_rxn
0,glucose,0.74,0.0,EX_glc__D_e
3,fructose,0.55,,EX_fru_e
5,succinate,0.46,,EX_succ_e
6,malate,0.44,,EX_mal__L_e
9,acetate,0.256,5.0,EX_ac_e


In [76]:
# Report how many binaries are active and, for each condition, where the
# fitted growth rate sits relative to the tolerance window around the measurement.
yopt = []
for rxn in stacker.model.reactions.query('binary_'):
    yopt.append(x_dict[rxn.id])
print('Number of non-zero binaries: %g' % sum(yopt))

for mdl_ind, mdl in iteritems(stacker.model_dict):
    dfi = df_meas[df_meas.substrate == mdl_ind]
    mu_measi = dfi.growth_rate_1_h.iloc[0]
    rxn_mu = stacker.model.reactions.get_by_id(mu_id + '_%s' % mdl_ind)
    muopt = x_dict[rxn_mu.id]
    muL, muU = mu_measi*(1-F_TOL), mu_measi*(1+F_TOL)
    report = (mu_crowd0, 100*F_TOL, muL, muopt, muU)
    print('Initial mu_crowd=%g. Fitted within %g%%: %g <= %g <= %g' % report)

Number of non-zero binaries: 43
Initial mu_crowd=nan. Fitted within 11.8%: 0.4851 <= 0.64862 <= 0.6149
Initial mu_crowd=nan. Fitted within 11.8%: 0.65268 <= 0.64862 <= 0.82732


In [83]:
# Fitted parameters
# For every reaction group, rebuild the fitted crowding coefficient from the
# active binaries:
#   kfit = a0 * sum over (digit k, power l) of y_kl * digit * radix**power
# where a0 is the original coefficient stored in the group's first triple.
kfit_dict = {}
for group_id, var_dict in iteritems(var_cons_dict):
    a0  = var_dict[0][2]
    kfit = 0.
    for l,pwr in enumerate(powers):
        for k,digit in enumerate(digits):
            # Binary variable ID is 'binary_' + group + digit index + power index
            yid = 'binary_%s%s%s' % (group_id,k,l)
            y   = x_dict[yid]
            if abs(y)>1e-10:
                print('%s. Value=%s. Power=%g. Digit=%g' % (yid, y, pwr, digit))
            kfit += y*a0*radix**pwr*digit
    kfit_dict[group_id] = kfit

binary_G6PDH2r00. Value=1.0. Power=-3. Digit=1
binary_AKGDH06. Value=1.0. Power=3. Digit=1
binary_ACKr02. Value=1.0. Power=-1. Digit=1
binary_GLUN05. Value=1.0. Power=2. Digit=1
binary_ME100. Value=1.0. Power=-3. Digit=1
binary_GND03. Value=1.0. Power=0. Digit=1
binary_ME204. Value=1.0. Power=1. Digit=1
binary_GLNS05. Value=1.0. Power=2. Digit=1
binary_FUM05. Value=1.0. Power=2. Digit=1
binary_SUCDi01. Value=1.0. Power=-2. Digit=1
binary_PPC06. Value=1.0. Power=3. Digit=1
binary_MDH05. Value=1.0. Power=2. Digit=1
binary_GLUSy02. Value=1.0. Power=-1. Digit=1
binary_PGL00. Value=1.0. Power=-3. Digit=1
binary_ACALD00. Value=1.0. Power=-3. Digit=1
binary_MALS01. Value=1.0. Power=-2. Digit=1
binary_ADK106. Value=1.0. Power=3. Digit=1
binary_PPS06. Value=1.0. Power=3. Digit=1
binary_PTAr06. Value=1.0. Power=3. Digit=1
binary_RPE00. Value=1.0. Power=-3. Digit=1
binary_ALCD2x04. Value=1.0. Power=1. Digit=1
binary_PPCK06. Value=1.0. Power=3. Digit=1
binary_TALA06. Value=1.0. Power=3. Digit=1
bi

In [84]:
# Show only the groups whose fitted coefficient is non-zero.
[(k,v) for k,v in iteritems(kfit_dict) if abs(v)>1e-10]

[(u'G6PDH2r', 5.341880341880342e-07),
 (u'AKGDH', 3.418803418803419e-05),
 (u'ACKr', 2.136752136752137e-06),
 (u'MALS', 1.0683760683760685e-06),
 (u'GLUN', 1.7094017094017095e-05),
 (u'ME1', 5.341880341880342e-07),
 (u'GND', 4.273504273504274e-06),
 (u'ME2', 8.547008547008548e-06),
 (u'GLNS', 1.7094017094017095e-05),
 (u'ADK1', 3.418803418803419e-05),
 (u'SUCDi', 1.0683760683760685e-06),
 (u'PPC', 3.418803418803419e-05),
 (u'MDH', 1.7094017094017095e-05),
 (u'FUM', 1.7094017094017095e-05),
 (u'GLUSy', 2.136752136752137e-06),
 (u'PGL', 5.341880341880342e-07),
 (u'ACALD', 5.341880341880342e-07),
 (u'PPS', 3.418803418803419e-05),
 (u'PTAr', 3.418803418803419e-05),
 (u'RPE', 5.341880341880342e-07),
 (u'ALCD2x', 8.547008547008548e-06),
 (u'TALA', 3.418803418803419e-05),
 (u'NADTRHD', 8.547008547008548e-06),
 (u'ICDHyr', 3.418803418803419e-05),
 (u'GAPD', 3.418803418803419e-05),
 (u'ICL', 1.0683760683760685e-06),
 (u'TPI', 2.136752136752137e-06),
 (u'ENO', 5.341880341880342e-07),
 (u'ACONTa'

### Plug back in to be sure

In [89]:
# Per-condition exchange bounds applied in the validation loop below.
df_conds

Unnamed: 0,cond,lb,obj,rxn,ub
0,glucose,-10,0.0,EX_glc__D_e,1000.0
1,glucose,0,0.0,EX_fru_e,1000.0
2,glucose,0,0.0,EX_succ_e,1000.0
3,glucose,0,0.0,EX_mal__L_e,1000.0
4,glucose,0,0.0,EX_ac_e,1000.0
5,fructose,0,0.0,EX_glc__D_e,1000.0
6,fructose,-10,0.0,EX_fru_e,1000.0
7,fructose,0,0.0,EX_succ_e,1000.0
8,fructose,0,0.0,EX_mal__L_e,1000.0
9,fructose,0,0.0,EX_ac_e,1000.0


In [95]:
#----------------------------------------
# Validation: for each condition, reload the basal model, apply that
# condition's exchange bounds, attach a crowding constraint built from the
# fitted coefficients, and compare simulated growth with the measurement.
csrcs = df_conds.cond.unique()
for csrc in csrcs:
    ijofit = load_json_model('/home/laurence/ME/models/BiGG_M/json/e_coli_core.json')

    # Exchange bounds for this carbon source
    df_condi = df_conds[df_conds.cond == csrc]
    for _, bounds_row in df_condi.iterrows():
        rxn = ijofit.reactions.get_by_id(bounds_row['rxn'])
        rxn.lower_bound = bounds_row['lb']
        rxn.upper_bound = bounds_row['ub']

    # Crowding constraint using the fitted coefficients
    crowding = Constraint('crowding')
    crowding._bound = crowding_bound0
    crowding._constraint_sense = 'L'
    for rid, kfit in iteritems(kfit_dict):
        ijofit.reactions.get_by_id(rid).add_metabolites({crowding: kfit})

    ijofit.optimize()

    mu_measi = df_meas[df_meas.substrate == csrc].growth_rate_1_h.iloc[0]
    mu_sim = ijofit.reactions.BIOMASS_Ecoli_core_w_GAM.x
    print('Cond=%s. mu_meas=%g. mu_sim=%g' % (csrc, mu_measi, mu_sim))
    for _, bounds_row in df_condi.iterrows():
        rxn = ijofit.reactions.get_by_id(bounds_row['rxn'])
        print('\t%s uptake=%g' % (rxn.id, rxn.x))

Cond=glucose. mu_meas=0.74. mu_sim=0.64862
	EX_glc__D_e uptake=-7.76293
	EX_fru_e uptake=0
	EX_succ_e uptake=0
	EX_mal__L_e uptake=0
	EX_ac_e uptake=0
Cond=fructose. mu_meas=0.55. mu_sim=0.64862
	EX_glc__D_e uptake=0
	EX_fru_e uptake=-7.76293
	EX_succ_e uptake=0
	EX_mal__L_e uptake=0
	EX_ac_e uptake=0
