In [140]:
import jax
from typing import Any, Callable, Sequence, Optional
from jax import lax, random, numpy as jnp
import flax
from flax import linen as nn
import sympy as sy
import numpy as np
import sys
sys.path.append("..")
from eql.eqlearner import EQL
from eql.symbolic import get_symbolic_expr, get_symbolic_expr_layer
from typing import List, Tuple, Callable
from functools import partial
import matplotlib.pyplot as plt
import scipy
sys.path.append("../../orient")
import optax
from functools import partial
from np_utils import flatten, unflatten

In [None]:
res = optimize_fire2(flat, energy, denergy, 0, logoutput=True)

8.441594 7.3435097
7.9098506 7.082759
7.6405 6.3421297
7.7673855 7.1826224
6.8366804 4.0830526
8.079469 4.6451917
7.725611 6.1240664
7.829009 4.527977
7.89986 4.5692663
7.763454 4.4965067
7.6107664 6.500814
7.7400956 6.317418
7.6105566 6.2703915
8.051039 7.0288496
7.3090844 4.959175
7.398381 5.300519
7.594365 7.1884995
7.6099224 5.8791895
7.650319 4.450931
7.2316356 6.0811625
6.9884067 5.246252
7.2901783 5.439336
7.043942 4.428419
7.0351305 6.154442
6.165093 4.1963377
6.544695 3.9341245
6.095541 3.5944333
6.1543016 3.6871386
5.663496 3.2503273
5.5035853 3.22661
5.2340283 2.9075613
4.943011 2.6520967
4.888158 2.7203648
4.2479486 2.7732327
4.073559 2.1792355
4.216922 2.9972115
3.6898308 1.7506588
3.9049366 6.0022764
3.2461581 1.3068101
3.3518028 4.1476326
3.3000906 4.0439053
3.213431 3.9721785
2.8873794 1.6780674
2.793352 0.7450148
2.715638 0.9330512
2.6977382 0.49766016
2.7313676 1.347295
2.7248657 0.86542416
2.657665 0.23280324
2.6693444 0.3723662
2.7528405 1.5595413
2.669566 0.565204


In [228]:
" Global variables for the FIRE algorithm"
alpha0 = 0.1
Ndelay = 5
Nmax = 400
finc = 1.1
fdec = 0.5
fa = 0.99
Nnegmax = 2000

#@partial(jax.jit, static_argnums=[1,2,3,4,5,6])
def optimize_fire(x0,f,df,params,atol=1e-4,dt = 0.002,logoutput=False):
    error = 10*atol 
    dtmax = 10*dt
    dtmin = 0.02*dt
    alpha = alpha0
    Npos = 0

    x = x0.copy()
    V = jnp.zeros(x.shape)
    F = -df(x,params)

    for i in range(Nmax):

        P = (F*V).sum() # dissipated power
        
        if (P>0.0):
            Npos = Npos + 1
            if Npos>Ndelay:
                dt = min(dt*finc,dtmax)
                alpha = alpha*fa
        else:
            Npos = 0
            dt = max(dt*fdec,dtmin)
            alpha = alpha0
            V = jnp.zeros(x.shape)

        V = V + 0.5*dt*F
        V = (1-alpha)*V + alpha*F*jnp.linalg.norm(V)/jnp.linalg.norm(F)
        x = x + dt*V
        F = -df(x,params)
        V = V + 0.5*dt*F

        error = max(abs(F))
        if error < atol: break

        if logoutput: print(f(x,params),error)

    del V, F  
    return [x,f(x,params),i]

def optimize_fire2(x0,f,df,params,atol=1e-4,dt = 0.002,logoutput=False):
    error = 10*atol 
    dtmax = 10*dt
    dtmin = 0.02*dt
    alpha = alpha0
    Npos = 0
    Nneg = 0
    key = jax.random.PRNGKey(1)

    x = x0.copy()
    V = jnp.zeros(x.shape)
    F = -df(x,params, key)

    for i in range(Nmax):
        key, _ = jax.random.split(key)
        P = (F*V).sum() # dissipated power
        
        if (P>0):
            Npos = Npos + 1
            Nneg = 0
            if Npos>Ndelay:
                dt = min(dt*finc,dtmax)
                alpha = alpha*fa
        else:
            Npos = 0
            Nneg = Nneg + 1
            if Nneg > Nnegmax: break
            if i> Ndelay:
                dt = max(dt*fdec,dtmin)
                alpha = alpha0
            x = x - 0.5*dt*V
            V = jnp.zeros(x.shape)
            
        V = V + 0.5*dt*F
        V = (1-alpha)*V + alpha*F*jnp.linalg.norm(V)/jnp.linalg.norm(F)
        x = x + dt*V
        F = -df(x,params, key)
        V = V + 0.5*dt*F

        error = max(abs(F))
        if error < atol: break

        if logoutput: print(f(x,params, key),error)

    del V, F  
    return [x,f(x,params, key),i]

In [227]:
spec, flat = flatten(params)

In [221]:
@jax.jit
def energy(x, params, key):
    return mse_fn(unflatten(spec, x), key)

denergy = jax.jit(jax.grad(energy))

In [222]:
funs = ['mul', 'cos', 'sin', 'exp', 'square']*2
e = EQL(n_layers=2, functions=funs, features=1, use_l0=True, drop_rate=0.03)
key = random.PRNGKey(0)

In [223]:
N = 10000
xdim = 3
x = (random.uniform(key, (N, xdim))-.5) * 3

y = x[:,0] + jnp.cos(x[:,1]) - 4.2*jnp.exp(-x[:,2]**2)
#y = jnp.cos(x) + 1 - x**2 

In [224]:
#params = e.init({'params':key}, x)
params = e.init({'params':key, 'l0': key}, x);

In [225]:
def mse_fn(params, key):
    pred = e.apply(params, x, rngs={'l0': key})
    return jnp.mean((pred-y)**2) + 1e-3*e.apply(params, rngs={'l0': key}, method=e.l0_reg)

In [226]:
def l2_fn(params):
    return sum(
        jnp.square(w).mean() for w in jax.tree_leaves(params["params"])
    )

In [216]:
def loss(params, key):
    return mse_fn(params, key)
loss_grad_fn = jax.jit(jax.value_and_grad(loss))

In [217]:
tx = optax.adam(learning_rate=1e-2)
opt_state = tx.init(params)
loss_grad_fn = jax.jit(jax.value_and_grad(loss))

In [218]:

for i in range(1000):
    key, _ = jax.random.split(key)
    loss_val, grads = loss_grad_fn(params, key)
    updates, opt_state = tx.update(grads, opt_state)
    params = optax.apply_updates(params, updates)
    if i % 9 == 0:
        print(loss_val)

7.4362807
3.8227262
2.8572721
2.7632446
2.6407542
2.6195922
2.6266215
2.6010928
2.6209812


KeyboardInterrupt: 

In [None]:
params = unflatten(spec, res[0])

In [220]:
symb = get_symbolic_expr(params, funs, use_l0=True)[0]
print(symb)

-0.0816873162984848*(-0.151793195126471*(-0.790051938952845*x0 + 0.0100178682560767*x1 + x2 - 0.322748684408874)**2 + 0.138688459992409*(-0.185519084334373*x0 - 0.122545197606087*x1 - 0.413200706243515*x2 + 0.221919417381287)*(0.0904271304607391*x0 + 0.179359629750252*x1 - 0.298895567655563*x2 + 0.125625714659691) + 0.518965125083923*(0.031295508146286*x0 - 0.386456817388535*x1 + 0.623118996620178*x2 - 0.0815803706645966)*(0.313285291194916*x0 + 0.268061995506287*x1 + 0.383731961250305*x2 - 0.0203135889023542) - 0.126765544065272*(0.476609905121115*x0 + x1 + 0.373021288993924*x2 + 0.171137880820102)**2 + 0.0139548271878929*exp(-0.625370919704437*x0 - 0.607832014560699*x1 + 0.137379005551338*x2) + 0.40480620327261*exp(-0.186916932463646*x0 + 0.543061375617981*x1 + 0.742142677307129*x2) + 0.135304778814316*sin(0.146374300122261*x0 + 0.209242224693298*x1 + 0.0300927981734276*x2 - 0.164824962615967) + 0.550004899501801*sin(0.637856662273407*x0 - 0.367531180381775*x1 - 0.463934332132339*x2 