## Parameterize MLP 

In [1]:
import tensorflow as tf
from tensorflow.keras.models import Sequential
from tensorflow.keras.layers import Dense
from tensorflow.keras.optimizers import Adam
import pandas as pd

def mlpResult(structure):

    fishModel = Sequential()
    for index in range(len(structure)):
       if index == 0:
        fishModel.add(Dense(structure[index], input_shape = (27,), activation = "relu"))
        continue
       
       fishModel.add(Dense(structure[index], activation = "relu"))
        
     
    fishModel.add(Dense(1, activation = "linear"))
    fishModel.compile(optimizer = Adam(), loss = "mean_squared_error", metrics = ["mean_squared_error"])
    print(fishModel.summary())
    return fishModel

## Parameterize KAN

In [2]:
import torch
from kan import *
from kan.utils import create_dataset_from_data

def kanResult(Structure, GridSize):
    return KAN(width = Structure, grid = GridSize, seed = 42)


## Compare the Performance of KAN versus MLP

In [10]:
import numpy as np
from sklearn.metrics import mean_squared_error
import torch
from kan import *
from kan.utils import create_dataset_from_data


modType = []
Params = []
Layers = []
GridSize = []
Error = []

Data = pd.read_csv("mlpData.csv").drop( ["Date", "Unnamed: 0"],axis = 1)

trainData = Data[Data["Year"] < 2021]

testData = Data[Data["Year"] > 2020]

xTestData = testData.drop(["Target"], axis = 1)
yTestData = testData["Target"]
    
xMLP = trainData.drop(["Target"], axis = 1)
yMLP = trainData["Target"]

xKAN = torch.tensor(xMLP.values, dtype=torch.float32)
yKAN = torch.tensor(yMLP.values, dtype=torch.float32)
yKAN = yKAN.reshape(-1,1)

data = create_dataset_from_data(xKAN, yKAN, train_ratio = 1)

for sample in range(0,300,1):

    np.random.seed(sample)

    hidden = round(np.random.normal(loc = 3, scale = 1))
    if hidden <= 0:
        hidden = hidden * -1 + 1
        
    mlpStructure = []
    kanStructure = []
    
    for i in range(0,hidden,1):
        
        nuerons = (round(np.random.normal(loc = 25, scale = 10)))
        kanNuerons = (round(np.random.normal(loc = 4, scale = 1)))
        if nuerons <= 0:
            nuerons = nuerons * -1 + 1
            
        mlpStructure.append(nuerons)
        kanStructure.append(kanNuerons)

    kanStructure.append(1)
    kanStructure[0] = 27
        
    
    gridSize = round(np.random.normal(loc = 9, scale = 3))
    if gridSize <= 0:
        gridSize = gridSize * -1 +1

    mlpParams = 0
    for index in range(len(mlpStructure)):
        if index == 0:
            mlpParams += mlpStructure[index] * 27 + mlpStructure[index]
        else:
            mlpParams += mlpStructure[index] * mlpStructure[index-1] + mlpStructure[index]
    mlpParams += mlpStructure[-1] + 1

    MLP = mlpResult(mlpStructure)
    MLP.fit(xMLP,yMLP, epochs = 10, batch_size = 1, validation_split = 0)
    Predictions = MLP.predict(xTestData)
    Eps = mean_squared_error(yTestData, Predictions)
    
    Error.append(Eps)
    Params.append(mlpParams)
    modType.append("MLP")
    Layers.append(len(mlpStructure))
    GridSize.append(None)
    
    kanParams = 0

    for index in range(len(kanStructure)):
        if index == 0:
            kanParams += kanStructure[index]
        else:
            kanParams += kanStructure[index] * kanStructure[index-1] 

    kanParams = kanParams * 3 * gridSize

    print(kanStructure)
    KAN =  KAN(width = kanStructure, grid = gridSize, seed = sample)
    
    KAN.fit(data, opt="LBFGS", steps=50, lamb=0.001, loss_fn = torch.nn.MSELoss())
    Predictions = KAN(torch.tensor(xTestData.values, dtype=torch.float32))

    if torch.isnan(Predictions).any() == True:
        print("ERROR ON SAMPLE", sample)
        continue 
        
    Eps = mean_squared_error(yTestData, Predictions.detach().numpy())

    Error.append(Eps)
    Params.append(kanParams)
    modType.append("KAN")
    Layers.append(len(kanStructure)-1)
    GridSize.append(gridSize)
    
    
    
    
Results = pd.DataFrame({                    
                        "modType": modType,
                        "Params": Params,
                        "Hidden_Layers": Layers,
                        "GridSize": GridSize,
                        "Error": Error
                      })

Results.to_csv("Results.csv") 

Model: "sequential_59"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_276 (Dense)           (None, 29)                812       
                                                                 
 dense_277 (Dense)           (None, 47)                1410      
                                                                 
 dense_278 (Dense)           (None, 15)                720       
                                                                 
 dense_279 (Dense)           (None, 23)                368       
                                                                 
 dense_280 (Dense)           (None, 29)                696       
                                                                 
 dense_281 (Dense)           (None, 1)                 30        
                                                                 
Total params: 4,036
Trainable params: 4,036
Non-train

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.74e+03 | test_loss: nan | reg: 7.36e+01 | : 100%|███| 50/50 [01:18<00:00,  1.57s/it]

saving model version 0.1
Model: "sequential_60"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_282 (Dense)           (None, 19)                532       
                                                                 
 dense_283 (Dense)           (None, 14)                280       
                                                                 
 dense_284 (Dense)           (None, 2)                 30        
                                                                 
 dense_285 (Dense)           (None, 17)                51        
                                                                 
 dense_286 (Dense)           (None, 23)                414       
                                                                 
 dense_287 (Dense)           (None, 1)                 24        
                                                                 
Total params: 1,331
Trainabl




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 6, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.42e+03 | test_loss: nan | reg: 7.85e+01 | : 100%|███| 50/50 [01:07<00:00,  1.35s/it]

saving model version 0.1
Model: "sequential_61"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_288 (Dense)           (None, 24)                672       
                                                                 
 dense_289 (Dense)           (None, 41)                1025      
                                                                 
 dense_290 (Dense)           (None, 17)                714       
                                                                 
 dense_291 (Dense)           (None, 1)                 18        
                                                                 
Total params: 2,429
Trainable params: 2,429
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.24e+03 | test_loss: nan | reg: 4.41e+01 | : 100%|███| 50/50 [00:27<00:00,  1.79it/s]


saving model version 0.1
Model: "sequential_62"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_292 (Dense)           (None, 29)                812       
                                                                 
 dense_293 (Dense)           (None, 6)                 180       
                                                                 
 dense_294 (Dense)           (None, 21)                147       
                                                                 
 dense_295 (Dense)           (None, 19)                418       
                                                                 
 dense_296 (Dense)           (None, 20)                400       
                                                                 
 dense_297 (Dense)           (None, 1)                 21        
                                                                 
Total params: 1,978
Trainabl

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:18<00:00,  1.58s/it]

saving model version 0.1
ERROR ON SAMPLE 3
Model: "sequential_63"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_298 (Dense)           (None, 30)                840       
                                                                 
 dense_299 (Dense)           (None, 32)                992       
                                                                 
 dense_300 (Dense)           (None, 9)                 297       
                                                                 
 dense_301 (Dense)           (None, 1)                 10        
                                                                 
Total params: 2,139
Trainable params: 2,139
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.11e+03 | test_loss: nan | reg: 4.33e+01 | : 100%|███| 50/50 [00:46<00:00,  1.09it/s]

saving model version 0.1
Model: "sequential_64"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_302 (Dense)           (None, 22)                616       
                                                                 
 dense_303 (Dense)           (None, 22)                506       
                                                                 
 dense_304 (Dense)           (None, 41)                943       
                                                                 
 dense_305 (Dense)           (None, 1)                 42        
                                                                 
Total params: 2,107
Trainable params: 2,107
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:38<00:00,  1.29it/s]

saving model version 0.1
ERROR ON SAMPLE 5
Model: "sequential_65"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_306 (Dense)           (None, 32)                896       
                                                                 
 dense_307 (Dense)           (None, 16)                528       
                                                                 
 dense_308 (Dense)           (None, 34)                578       
                                                                 
 dense_309 (Dense)           (None, 1)                 35        
                                                                 
Total params: 2,037
Trainable params: 2,037
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.91e+03 | test_loss: nan | reg: 7.43e+01 | : 100%|███| 50/50 [00:32<00:00,  1.52it/s]

saving model version 0.1
Model: "sequential_66"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_310 (Dense)           (None, 20)                560       
                                                                 
 dense_311 (Dense)           (None, 29)                609       
                                                                 
 dense_312 (Dense)           (None, 25)                750       
                                                                 
 dense_313 (Dense)           (None, 7)                 182       
                                                                 
 dense_314 (Dense)           (None, 31)                248       
                                                                 
 dense_315 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,381
Trainabl




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.92e+03 | test_loss: nan | reg: 7.49e+01 | : 100%|███| 50/50 [01:18<00:00,  1.56s/it]

saving model version 0.1
Model: "sequential_67"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_316 (Dense)           (None, 36)                1008      
                                                                 
 dense_317 (Dense)           (None, 11)                407       
                                                                 
 dense_318 (Dense)           (None, 49)                588       
                                                                 
 dense_319 (Dense)           (None, 1)                 50        
                                                                 
Total params: 2,053
Trainable params: 2,053
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:02<00:00,  1.25s/it]

saving model version 0.1
ERROR ON SAMPLE 8
Model: "sequential_68"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_320 (Dense)           (None, 22)                616       
                                                                 
 dense_321 (Dense)           (None, 25)                575       
                                                                 
 dense_322 (Dense)           (None, 20)                520       
                                                                 
 dense_323 (Dense)           (None, 1)                 21        
                                                                 
Total params: 1,732
Trainable params: 1,732
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.17e+03 | test_loss: nan | reg: 4.88e+01 | : 100%|███| 50/50 [00:41<00:00,  1.20it/s]

saving model version 0.1
Model: "sequential_69"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_324 (Dense)           (None, 32)                896       
                                                                 
 dense_325 (Dense)           (None, 25)                825       
                                                                 
 dense_326 (Dense)           (None, 18)                468       
                                                                 
 dense_327 (Dense)           (None, 26)                494       
                                                                 
 dense_328 (Dense)           (None, 1)                 27        
                                                                 
Total params: 2,710
Trainable params: 2,710
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.03e+03 | test_loss: nan | reg: 5.36e+01 | : 100%|███| 50/50 [01:02<00:00,  1.25s/it]

saving model version 0.1
Model: "sequential_70"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_329 (Dense)           (None, 22)                616       
                                                                 
 dense_330 (Dense)           (None, 3)                 69        
                                                                 
 dense_331 (Dense)           (None, 22)                88        
                                                                 
 dense_332 (Dense)           (None, 28)                644       
                                                                 
 dense_333 (Dense)           (None, 14)                406       
                                                                 
 dense_334 (Dense)           (None, 1)                 15        
                                                                 
Total params: 1,838
Trainabl




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.38e+03 | test_loss: nan | reg: 9.16e+01 | : 100%|███| 50/50 [01:11<00:00,  1.43s/it]

saving model version 0.1
Model: "sequential_71"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_335 (Dense)           (None, 18)                504       
                                                                 
 dense_336 (Dense)           (None, 8)                 152       
                                                                 
 dense_337 (Dense)           (None, 10)                90        
                                                                 
 dense_338 (Dense)           (None, 1)                 11        
                                                                 
Total params: 757
Trainable params: 757
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.44e+03 | test_loss: nan | reg: 6.82e+01 | : 100%|███| 50/50 [00:47<00:00,  1.05it/s]

saving model version 0.1
Model: "sequential_72"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_339 (Dense)           (None, 33)                924       
                                                                 
 dense_340 (Dense)           (None, 30)                1020      
                                                                 
 dense_341 (Dense)           (None, 1)                 31        
                                                                 
Total params: 1,975
Trainable params: 1,975
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 3.79e+01 | : 100%|███| 50/50 [00:25<00:00,  1.95it/s]

saving model version 0.1
Model: "sequential_73"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_342 (Dense)           (None, 26)                728       
                                                                 
 dense_343 (Dense)           (None, 24)                648       
                                                                 
 dense_344 (Dense)           (None, 26)                650       
                                                                 
 dense_345 (Dense)           (None, 27)                729       
                                                                 
 dense_346 (Dense)           (None, 36)                1008      
                                                                 
 dense_347 (Dense)           (None, 1)                 37        
                                                                 
Total params: 3,800
Trainabl




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 2, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:05<00:00,  1.31s/it]

saving model version 0.1
ERROR ON SAMPLE 14
Model: "sequential_74"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_348 (Dense)           (None, 28)                784       
                                                                 
 dense_349 (Dense)           (None, 20)                580       
                                                                 
 dense_350 (Dense)           (None, 7)                 147       
                                                                 
 dense_351 (Dense)           (None, 1)                 8         
                                                                 
Total params: 1,519
Trainable params: 1,519
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.65e+02 | : 100%|███| 50/50 [00:19<00:00,  2.58it/s]


saving model version 0.1
Model: "sequential_75"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_352 (Dense)           (None, 10)                280       
                                                                 
 dense_353 (Dense)           (None, 26)                286       
                                                                 
 dense_354 (Dense)           (None, 19)                513       
                                                                 
 dense_355 (Dense)           (None, 1)                 20        
                                                                 
Total params: 1,099
Trainable params: 1,099
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.05e+03 | test_loss: nan | reg: 4.74e+01 | : 100%|███| 50/50 [00:44<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_76"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_356 (Dense)           (None, 6)                 168       
                                                                 
 dense_357 (Dense)           (None, 36)                252       
                                                                 
 dense_358 (Dense)           (None, 44)                1628      
                                                                 
 dense_359 (Dense)           (None, 1)                 45        
                                                                 
Total params: 2,093
Trainable params: 2,093
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 6.66e+01 | : 100%|███| 50/50 [00:40<00:00,  1.25it/s]

saving model version 0.1
Model: "sequential_77"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_360 (Dense)           (None, 47)                1316      
                                                                 
 dense_361 (Dense)           (None, 27)                1296      
                                                                 
 dense_362 (Dense)           (None, 31)                868       
                                                                 
 dense_363 (Dense)           (None, 1)                 32        
                                                                 
Total params: 3,512
Trainable params: 3,512
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.01e+03 | test_loss: nan | reg: 5.43e+01 | : 100%|███| 50/50 [00:48<00:00,  1.04it/s]

saving model version 0.1
Model: "sequential_78"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_364 (Dense)           (None, 22)                616       
                                                                 
 dense_365 (Dense)           (None, 21)                483       
                                                                 
 dense_366 (Dense)           (None, 23)                506       
                                                                 
 dense_367 (Dense)           (None, 1)                 24        
                                                                 
Total params: 1,629
Trainable params: 1,629
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 6.84e+01 | : 100%|███| 50/50 [00:22<00:00,  2.25it/s]


saving model version 0.1
Model: "sequential_79"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_368 (Dense)           (None, 27)                756       
                                                                 
 dense_369 (Dense)           (None, 2)                 56        
                                                                 
 dense_370 (Dense)           (None, 31)                93        
                                                                 
 dense_371 (Dense)           (None, 15)                480       
                                                                 
 dense_372 (Dense)           (None, 1)                 16        
                                                                 
Total params: 1,401
Trainable params: 1,401
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.23e+02 | : 100%|███| 50/50 [00:31<00:00,  1.58it/s]

saving model version 0.1
Model: "sequential_80"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_373 (Dense)           (None, 24)                672       
                                                                 
 dense_374 (Dense)           (None, 12)                300       
                                                                 
 dense_375 (Dense)           (None, 8)                 104       
                                                                 
 dense_376 (Dense)           (None, 1)                 9         
                                                                 
Total params: 1,085
Trainable params: 1,085
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 3.86e+01 | : 100%|███| 50/50 [00:21<00:00,  2.33it/s]


saving model version 0.1
Model: "sequential_81"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_377 (Dense)           (None, 10)                280       
                                                                 
 dense_378 (Dense)           (None, 23)                253       
                                                                 
 dense_379 (Dense)           (None, 15)                360       
                                                                 
 dense_380 (Dense)           (None, 1)                 16        
                                                                 
Total params: 909
Trainable params: 909
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 7.14e+01 | : 100%|███| 50/50 [00:45<00:00,  1.09it/s]

saving model version 0.1
Model: "sequential_82"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_381 (Dense)           (None, 25)                700       
                                                                 
 dense_382 (Dense)           (None, 34)                884       
                                                                 
 dense_383 (Dense)           (None, 14)                490       
                                                                 
 dense_384 (Dense)           (None, 14)                210       
                                                                 
 dense_385 (Dense)           (None, 1)                 15        
                                                                 
Total params: 2,299
Trainable params: 2,299
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.65e+03 | test_loss: nan | reg: 6.48e+01 | : 100%|███| 50/50 [01:06<00:00,  1.32s/it]

saving model version 0.1
Model: "sequential_83"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_386 (Dense)           (None, 17)                476       
                                                                 
 dense_387 (Dense)           (None, 15)                270       
                                                                 
 dense_388 (Dense)           (None, 11)                176       
                                                                 
 dense_389 (Dense)           (None, 28)                336       
                                                                 
 dense_390 (Dense)           (None, 1)                 29        
                                                                 
Total params: 1,287
Trainable params: 1,287
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 4.86e+01 | : 100%|███| 50/50 [00:56<00:00,  1.13s/it]


saving model version 0.1
Model: "sequential_84"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_391 (Dense)           (None, 35)                980       
                                                                 
 dense_392 (Dense)           (None, 19)                684       
                                                                 
 dense_393 (Dense)           (None, 23)                460       
                                                                 
 dense_394 (Dense)           (None, 1)                 24        
                                                                 
Total params: 2,148
Trainable params: 2,148
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:45<00:00,  1.09it/s]

saving model version 0.1
ERROR ON SAMPLE 25
Model: "sequential_85"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_395 (Dense)           (None, 6)                 168       
                                                                 
 dense_396 (Dense)           (None, 32)                224       
                                                                 
 dense_397 (Dense)           (None, 28)                924       
                                                                 
 dense_398 (Dense)           (None, 1)                 29        
                                                                 
Total params: 1,345
Trainable params: 1,345
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.08e+03 | test_loss: nan | reg: 8.79e+01 | : 100%|███| 50/50 [00:43<00:00,  1.16it/s]

saving model version 0.1
Model: "sequential_86"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_399 (Dense)           (None, 22)                616       
                                                                 
 dense_400 (Dense)           (None, 29)                667       
                                                                 
 dense_401 (Dense)           (None, 24)                720       
                                                                 
 dense_402 (Dense)           (None, 27)                675       
                                                                 
 dense_403 (Dense)           (None, 1)                 28        
                                                                 
Total params: 2,706
Trainable params: 2,706
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.95e+03 | test_loss: nan | reg: 7.26e+01 | : 100%|███| 50/50 [01:05<00:00,  1.31s/it]

saving model version 0.1
Model: "sequential_87"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_404 (Dense)           (None, 42)                1176      
                                                                 
 dense_405 (Dense)           (None, 15)                645       
                                                                 
 dense_406 (Dense)           (None, 40)                640       
                                                                 
 dense_407 (Dense)           (None, 1)                 41        
                                                                 
Total params: 2,502
Trainable params: 2,502
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.20e+03 | test_loss: nan | reg: 6.09e+01 | : 100%|███| 50/50 [00:49<00:00,  1.02it/s]

saving model version 0.1
Model: "sequential_88"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_408 (Dense)           (None, 32)                896       
                                                                 
 dense_409 (Dense)           (None, 4)                 132       
                                                                 
 dense_410 (Dense)           (None, 30)                150       
                                                                 
 dense_411 (Dense)           (None, 1)                 31        
                                                                 
Total params: 1,209
Trainable params: 1,209
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 4.11e+01 | : 100%|███| 50/50 [00:41<00:00,  1.20it/s]

saving model version 0.1
Model: "sequential_89"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_412 (Dense)           (None, 40)                1120      
                                                                 
 dense_413 (Dense)           (None, 30)                1230      
                                                                 
 dense_414 (Dense)           (None, 1)                 31        
                                                                 
Total params: 2,381
Trainable params: 2,381
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.23e+03 | test_loss: nan | reg: 3.76e+01 | : 100%|███| 50/50 [00:26<00:00,  1.88it/s]

saving model version 0.1
Model: "sequential_90"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_415 (Dense)           (None, 22)                616       
                                                                 
 dense_416 (Dense)           (None, 17)                391       
                                                                 
 dense_417 (Dense)           (None, 17)                306       
                                                                 
 dense_418 (Dense)           (None, 1)                 18        
                                                                 
Total params: 1,331
Trainable params: 1,331
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 4.32e+01 | : 100%|███| 50/50 [00:49<00:00,  1.02it/s]

saving model version 0.1
Model: "sequential_91"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_419 (Dense)           (None, 35)                980       
                                                                 
 dense_420 (Dense)           (None, 26)                936       
                                                                 
 dense_421 (Dense)           (None, 31)                837       
                                                                 
 dense_422 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,785
Trainable params: 2,785
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.72e+03 | test_loss: nan | reg: 5.94e+01 | : 100%|███| 50/50 [00:56<00:00,  1.14s/it]

saving model version 0.1
Model: "sequential_92"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_423 (Dense)           (None, 9)                 252       
                                                                 
 dense_424 (Dense)           (None, 19)                190       
                                                                 
 dense_425 (Dense)           (None, 28)                560       
                                                                 
 dense_426 (Dense)           (None, 1)                 29        
                                                                 
Total params: 1,031
Trainable params: 1,031
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.98e+03 | test_loss: nan | reg: 6.36e+01 | : 100%|███| 50/50 [00:57<00:00,  1.14s/it]

saving model version 0.1
Model: "sequential_93"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_427 (Dense)           (None, 18)                504       
                                                                 
 dense_428 (Dense)           (None, 20)                380       
                                                                 
 dense_429 (Dense)           (None, 12)                252       
                                                                 
 dense_430 (Dense)           (None, 1)                 13        
                                                                 
Total params: 1,149
Trainable params: 1,149
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 4.14e+01 | : 100%|███| 50/50 [00:35<00:00,  1.39it/s]

saving model version 0.1
Model: "sequential_94"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_431 (Dense)           (None, 21)                588       
                                                                 
 dense_432 (Dense)           (None, 1)                 22        
                                                                 
Total params: 610
Trainable params: 610
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.04e+02 | : 100%|███| 50/50 [00:07<00:00,  6.28it/s]


saving model version 0.1
Model: "sequential_95"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_433 (Dense)           (None, 40)                1120      
                                                                 
 dense_434 (Dense)           (None, 37)                1517      
                                                                 
 dense_435 (Dense)           (None, 17)                646       
                                                                 
 dense_436 (Dense)           (None, 26)                468       
                                                                 
 dense_437 (Dense)           (None, 1)                 27        
                                                                 
Total params: 3,778
Trainable params: 3,778
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 7.17e+01 | : 100%|███| 50/50 [00:42<00:00,  1.17it/s]


saving model version 0.1
Model: "sequential_96"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_438 (Dense)           (None, 32)                896       
                                                                 
 dense_439 (Dense)           (None, 12)                396       
                                                                 
 dense_440 (Dense)           (None, 35)                455       
                                                                 
 dense_441 (Dense)           (None, 1)                 36        
                                                                 
Total params: 1,783
Trainable params: 1,783
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 4, 1]
checkpoint directory created

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.07e+03 | test_loss: nan | reg: 5.73e+01 | : 100%|███| 50/50 [00:54<00:00,  1.08s/it]

saving model version 0.1
Model: "sequential_97"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_442 (Dense)           (None, 22)                616       
                                                                 
 dense_443 (Dense)           (None, 28)                644       
                                                                 
 dense_444 (Dense)           (None, 41)                1189      
                                                                 
 dense_445 (Dense)           (None, 13)                546       
                                                                 
 dense_446 (Dense)           (None, 1)                 14        
                                                                 
Total params: 3,009
Trainable params: 3,009
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.38e+03 | test_loss: nan | reg: 6.99e+01 | : 100%|███| 50/50 [01:02<00:00,  1.26s/it]

saving model version 0.1
Model: "sequential_98"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_447 (Dense)           (None, 27)                756       
                                                                 
 dense_448 (Dense)           (None, 26)                728       
                                                                 
 dense_449 (Dense)           (None, 49)                1323      
                                                                 
 dense_450 (Dense)           (None, 1)                 50        
                                                                 
 dense_451 (Dense)           (None, 1)                 2         
                                                                 
Total params: 2,859
Trainable params: 2,859
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 2, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.58e+03 | test_loss: nan | reg: 1.13e+02 | : 100%|███| 50/50 [01:06<00:00,  1.33s/it]

saving model version 0.1
Model: "sequential_99"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_452 (Dense)           (None, 24)                672       
                                                                 
 dense_453 (Dense)           (None, 34)                850       
                                                                 
 dense_454 (Dense)           (None, 1)                 35        
                                                                 
Total params: 1,557
Trainable params: 1,557
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.89e+03 | test_loss: nan | reg: 4.81e+01 | : 100%|███| 50/50 [00:31<00:00,  1.57it/s]

saving model version 0.1
Model: "sequential_100"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_455 (Dense)           (None, 26)                728       
                                                                 
 dense_456 (Dense)           (None, 16)                432       
                                                                 
 dense_457 (Dense)           (None, 15)                255       
                                                                 
 dense_458 (Dense)           (None, 1)                 16        
                                                                 
Total params: 1,431
Trainable params: 1,431
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.60e+03 | test_loss: nan | reg: 5.94e+01 | : 100%|███| 50/50 [00:54<00:00,  1.10s/it]

saving model version 0.1
Model: "sequential_101"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_459 (Dense)           (None, 24)                672       
                                                                 
 dense_460 (Dense)           (None, 40)                1000      
                                                                 
 dense_461 (Dense)           (None, 23)                943       
                                                                 
 dense_462 (Dense)           (None, 1)                 24        
                                                                 
Total params: 2,639
Trainable params: 2,639
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.31e+03 | test_loss: nan | reg: 2.42e+03 | : 100%|███| 50/50 [00:32<00:00,  1.56it/s]

saving model version 0.1
Model: "sequential_102"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_463 (Dense)           (None, 16)                448       
                                                                 
 dense_464 (Dense)           (None, 20)                340       
                                                                 
 dense_465 (Dense)           (None, 21)                441       
                                                                 
 dense_466 (Dense)           (None, 1)                 22        
                                                                 
Total params: 1,251
Trainable params: 1,251
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 5.45e+01 | : 100%|███| 50/50 [01:00<00:00,  1.20s/it]

saving model version 0.1
Model: "sequential_103"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_467 (Dense)           (None, 38)                1064      
                                                                 
 dense_468 (Dense)           (None, 9)                 351       
                                                                 
 dense_469 (Dense)           (None, 1)                 10        
                                                                 
Total params: 1,425
Trainable params: 1,425
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 7.56e+01 | : 100%|███| 50/50 [00:22<00:00,  2.23it/s]

saving model version 0.1
Model: "sequential_104"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_470 (Dense)           (None, 28)                784       
                                                                 
 dense_471 (Dense)           (None, 23)                667       
                                                                 
 dense_472 (Dense)           (None, 2)                 48        
                                                                 
 dense_473 (Dense)           (None, 1)                 3         
                                                                 
Total params: 1,502
Trainable params: 1,502
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.13e+03 | test_loss: nan | reg: 4.63e+01 | : 100%|███| 50/50 [00:42<00:00,  1.18it/s]

saving model version 0.1
Model: "sequential_105"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_474 (Dense)           (None, 37)                1036      
                                                                 
 dense_475 (Dense)           (None, 17)                646       
                                                                 
 dense_476 (Dense)           (None, 23)                414       
                                                                 
 dense_477 (Dense)           (None, 19)                456       
                                                                 
 dense_478 (Dense)           (None, 1)                 20        
                                                                 
Total params: 2,572
Trainable params: 2,572
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.89e+03 | test_loss: nan | reg: 6.44e+01 | : 100%|███| 50/50 [01:06<00:00,  1.33s/it]

saving model version 0.1
Model: "sequential_106"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_479 (Dense)           (None, 38)                1064      
                                                                 
 dense_480 (Dense)           (None, 31)                1209      
                                                                 
 dense_481 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,305
Trainable params: 2,305
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.28e+03 | test_loss: nan | reg: 2.80e+01 | : 100%|███| 50/50 [00:26<00:00,  1.86it/s]


saving model version 0.1
Model: "sequential_107"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_482 (Dense)           (None, 14)                392       
                                                                 
 dense_483 (Dense)           (None, 36)                540       
                                                                 
 dense_484 (Dense)           (None, 1)                 37        
                                                                 
Total params: 969
Trainable params: 969
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 7.49e+01 | : 100%|███| 50/50 [00:32<00:00,  1.54it/s]

saving model version 0.1
Model: "sequential_108"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_485 (Dense)           (None, 17)                476       
                                                                 
 dense_486 (Dense)           (None, 43)                774       
                                                                 
 dense_487 (Dense)           (None, 1)                 44        
                                                                 
Total params: 1,294
Trainable params: 1,294
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.09e+03 | test_loss: nan | reg: 2.93e+01 | : 100%|███| 50/50 [00:31<00:00,  1.57it/s]

saving model version 0.1
Model: "sequential_109"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_488 (Dense)           (None, 25)                700       
                                                                 
 dense_489 (Dense)           (None, 1)                 26        
                                                                 
Total params: 726
Trainable params: 726
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:05<00:00,  9.39it/s]


saving model version 0.1
Model: "sequential_110"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_490 (Dense)           (None, 26)                728       
                                                                 
 dense_491 (Dense)           (None, 11)                297       
                                                                 
 dense_492 (Dense)           (None, 25)                300       
                                                                 
 dense_493 (Dense)           (None, 1)                 26        
                                                                 
Total params: 1,351
Trainable params: 1,351
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.13e+03 | test_loss: nan | reg: 4.31e+01 | : 100%|███| 50/50 [00:47<00:00,  1.06it/s]

saving model version 0.1
Model: "sequential_111"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_494 (Dense)           (None, 12)                336       
                                                                 
 dense_495 (Dense)           (None, 17)                221       
                                                                 
 dense_496 (Dense)           (None, 29)                522       
                                                                 
 dense_497 (Dense)           (None, 32)                960       
                                                                 
 dense_498 (Dense)           (None, 1)                 33        
                                                                 
Total params: 2,072
Trainable params: 2,072
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:08<00:00,  1.38s/it]

saving model version 0.1
ERROR ON SAMPLE 52
Model: "sequential_112"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_499 (Dense)           (None, 37)                1036      
                                                                 
 dense_500 (Dense)           (None, 19)                722       
                                                                 
 dense_501 (Dense)           (None, 49)                980       
                                                                 
 dense_502 (Dense)           (None, 1)                 50        
                                                                 
Total params: 2,788
Trainable params: 2,788
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 7.63e+01 | : 100%|███| 50/50 [00:38<00:00,  1.29it/s]


saving model version 0.1
Model: "sequential_113"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_503 (Dense)           (None, 14)                392       
                                                                 
 dense_504 (Dense)           (None, 1)                 15        
                                                                 
Total params: 407
Trainable params: 407
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.03e+02 | : 100%|███| 50/50 [00:05<00:00, 10.00it/s]


saving model version 0.1
Model: "sequential_114"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_505 (Dense)           (None, 24)                672       
                                                                 
 dense_506 (Dense)           (None, 1)                 25        
                                                                 
Total params: 697
Trainable params: 697
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:07<00:00,  6.34it/s]


saving model version 0.1
Model: "sequential_115"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_507 (Dense)           (None, 31)                868       
                                                                 
 dense_508 (Dense)           (None, 20)                640       
                                                                 
 dense_509 (Dense)           (None, 1)                 21        
                                                                 
Total params: 1,529
Trainable params: 1,529
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.09e+03 | test_loss: nan | reg: 3.17e+01 | : 100%|███| 50/50 [00:28<00:00,  1.73it/s]

saving model version 0.1
Model: "sequential_116"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_510 (Dense)           (None, 23)                644       
                                                                 
 dense_511 (Dense)           (None, 17)                408       
                                                                 
 dense_512 (Dense)           (None, 47)                846       
                                                                 
 dense_513 (Dense)           (None, 1)                 48        
                                                                 
Total params: 1,946
Trainable params: 1,946
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 1, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.64e+03 | test_loss: nan | reg: 7.87e+01 | : 100%|███| 50/50 [00:45<00:00,  1.09it/s]

saving model version 0.1
Model: "sequential_117"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_514 (Dense)           (None, 4)                 112       
                                                                 
 dense_515 (Dense)           (None, 25)                125       
                                                                 
 dense_516 (Dense)           (None, 1)                 26        
                                                                 
Total params: 263
Trainable params: 263
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 6.40e+01 | : 100%|███| 50/50 [00:29<00:00,  1.71it/s]

saving model version 0.1
Model: "sequential_118"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_517 (Dense)           (None, 31)                868       
                                                                 
 dense_518 (Dense)           (None, 1)                 32        
                                                                 
Total params: 900
Trainable params: 900
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.01e+02 | : 100%|███| 50/50 [00:05<00:00,  8.99it/s]


saving model version 0.1
Model: "sequential_119"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_519 (Dense)           (None, 19)                532       
                                                                 
 dense_520 (Dense)           (None, 13)                260       
                                                                 
 dense_521 (Dense)           (None, 1)                 14        
                                                                 
Total params: 806
Trainable params: 806
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.39e+03 | test_loss: nan | reg: 5.64e+02 | : 100%|███| 50/50 [00:19<00:00,  2.52it/s]

saving model version 0.1
Model: "sequential_120"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_522 (Dense)           (None, 29)                812       
                                                                 
 dense_523 (Dense)           (None, 36)                1080      
                                                                 
 dense_524 (Dense)           (None, 32)                1184      
                                                                 
 dense_525 (Dense)           (None, 1)                 33        
                                                                 
Total params: 3,109
Trainable params: 3,109
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.18e+03 | test_loss: nan | reg: 4.51e+01 | : 100%|███| 50/50 [00:40<00:00,  1.25it/s]

saving model version 0.1
Model: "sequential_121"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_526 (Dense)           (None, 20)                560       
                                                                 
 dense_527 (Dense)           (None, 36)                756       
                                                                 
 dense_528 (Dense)           (None, 34)                1258      
                                                                 
 dense_529 (Dense)           (None, 1)                 35        
                                                                 
Total params: 2,609
Trainable params: 2,609
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.31e+03 | test_loss: nan | reg: 4.89e+01 | : 100%|███| 50/50 [00:34<00:00,  1.45it/s]

saving model version 0.1
Model: "sequential_122"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_530 (Dense)           (None, 36)                1008      
                                                                 
 dense_531 (Dense)           (None, 1)                 37        
                                                                 
Total params: 1,045
Trainable params: 1,045
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:06<00:00,  8.18it/s]

saving model version 0.1
Model: "sequential_123"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_532 (Dense)           (None, 5)                 140       
                                                                 
 dense_533 (Dense)           (None, 47)                282       
                                                                 
 dense_534 (Dense)           (None, 21)                1008      
                                                                 
 dense_535 (Dense)           (None, 15)                330       
                                                                 
 dense_536 (Dense)           (None, 1)                 16        
                                                                 
Total params: 1,776
Trainable params: 1,776
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 3, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:58<00:00,  1.16s/it]

saving model version 0.1
ERROR ON SAMPLE 64
Model: "sequential_124"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_537 (Dense)           (None, 20)                560       
                                                                 
 dense_538 (Dense)           (None, 20)                420       
                                                                 
 dense_539 (Dense)           (None, 1)                 21        
                                                                 
Total params: 1,001
Trainable params: 1,001
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.67e+03 | test_loss: nan | reg: 6.14e+01 | : 100%|███| 50/50 [00:39<00:00,  1.28it/s]

saving model version 0.1
Model: "sequential_125"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_540 (Dense)           (None, 14)                392       
                                                                 
 dense_541 (Dense)           (None, 17)                255       
                                                                 
 dense_542 (Dense)           (None, 41)                738       
                                                                 
 dense_543 (Dense)           (None, 39)                1638      
                                                                 
 dense_544 (Dense)           (None, 1)                 40        
                                                                 
Total params: 3,063
Trainable params: 3,063
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.21e+03 | test_loss: nan | reg: 5.59e+03 | : 100%|███| 50/50 [00:59<00:00,  1.19s/it]

saving model version 0.1
Model: "sequential_126"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_545 (Dense)           (None, 26)                728       
                                                                 
 dense_546 (Dense)           (None, 37)                999       
                                                                 
 dense_547 (Dense)           (None, 19)                722       
                                                                 
 dense_548 (Dense)           (None, 37)                740       
                                                                 
 dense_549 (Dense)           (None, 1)                 38        
                                                                 
Total params: 3,227
Trainable params: 3,227
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.72e+03 | test_loss: nan | reg: 1.37e+03 | : 100%|███| 50/50 [00:33<00:00,  1.51it/s]

saving model version 0.1
Model: "sequential_127"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_550 (Dense)           (None, 27)                756       
                                                                 
 dense_551 (Dense)           (None, 33)                924       
                                                                 
 dense_552 (Dense)           (None, 1)                 34        
                                                                 
Total params: 1,714
Trainable params: 1,714
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.32e+03 | test_loss: nan | reg: 3.28e+01 | : 100%|███| 50/50 [00:31<00:00,  1.57it/s]

saving model version 0.1
Model: "sequential_128"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_553 (Dense)           (None, 19)                532       
                                                                 
 dense_554 (Dense)           (None, 19)                380       
                                                                 
 dense_555 (Dense)           (None, 29)                580       
                                                                 
 dense_556 (Dense)           (None, 36)                1080      
                                                                 
 dense_557 (Dense)           (None, 1)                 37        
                                                                 
Total params: 2,609
Trainable params: 2,609
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 3.93e+01 | : 100%|███| 50/50 [00:26<00:00,  1.86it/s]


saving model version 0.1
Model: "sequential_129"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_558 (Dense)           (None, 27)                756       
                                                                 
 dense_559 (Dense)           (None, 21)                588       
                                                                 
 dense_560 (Dense)           (None, 36)                792       
                                                                 
 dense_561 (Dense)           (None, 21)                777       
                                                                 
 dense_562 (Dense)           (None, 1)                 22        
                                                                 
Total params: 2,935
Trainable params: 2,935
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/1

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.12e+03 | test_loss: nan | reg: 1.16e+03 | : 100%|███| 50/50 [00:55<00:00,  1.11s/it]

saving model version 0.1
Model: "sequential_130"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_563 (Dense)           (None, 13)                364       
                                                                 
 dense_564 (Dense)           (None, 30)                420       
                                                                 
 dense_565 (Dense)           (None, 31)                961       
                                                                 
 dense_566 (Dense)           (None, 1)                 32        
                                                                 
Total params: 1,777
Trainable params: 1,777
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.50e+03 | test_loss: nan | reg: 5.56e+01 | : 100%|███| 50/50 [00:46<00:00,  1.08it/s]

saving model version 0.1
Model: "sequential_131"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_567 (Dense)           (None, 18)                504       
                                                                 
 dense_568 (Dense)           (None, 31)                589       
                                                                 
 dense_569 (Dense)           (None, 8)                 256       
                                                                 
 dense_570 (Dense)           (None, 1)                 9         
                                                                 
Total params: 1,358
Trainable params: 1,358
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.49e+03 | test_loss: nan | reg: 7.54e+01 | : 100%|███| 50/50 [00:54<00:00,  1.09s/it]

saving model version 0.1
Model: "sequential_132"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_571 (Dense)           (None, 46)                1288      
                                                                 
 dense_572 (Dense)           (None, 28)                1316      
                                                                 
 dense_573 (Dense)           (None, 25)                725       
                                                                 
 dense_574 (Dense)           (None, 10)                260       
                                                                 
 dense_575 (Dense)           (None, 1)                 11        
                                                                 
Total params: 3,600
Trainable params: 3,600
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.19e+03 | test_loss: nan | reg: 3.73e+01 | : 100%|███| 50/50 [00:47<00:00,  1.06it/s]

saving model version 0.1
Model: "sequential_133"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_576 (Dense)           (None, 19)                532       
                                                                 
 dense_577 (Dense)           (None, 34)                680       
                                                                 
 dense_578 (Dense)           (None, 19)                665       
                                                                 
 dense_579 (Dense)           (None, 38)                760       
                                                                 
 dense_580 (Dense)           (None, 1)                 39        
                                                                 
Total params: 2,676
Trainable params: 2,676
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 6.34e+01 | : 100%|███| 50/50 [01:06<00:00,  1.33s/it]

saving model version 0.1
Model: "sequential_134"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_581 (Dense)           (None, 26)                728       
                                                                 
 dense_582 (Dense)           (None, 44)                1188      
                                                                 
 dense_583 (Dense)           (None, 1)                 45        
                                                                 
Total params: 1,961
Trainable params: 1,961
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 3.28e+01 | : 100%|███| 50/50 [00:22<00:00,  2.24it/s]

saving model version 0.1
Model: "sequential_135"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_584 (Dense)           (None, 19)                532       
                                                                 
 dense_585 (Dense)           (None, 19)                380       
                                                                 
 dense_586 (Dense)           (None, 23)                460       
                                                                 
 dense_587 (Dense)           (None, 27)                648       
                                                                 
 dense_588 (Dense)           (None, 1)                 28        
                                                                 





Total params: 2,048
Trainable params: 2,048
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.61e+03 | test_loss: nan | reg: 7.19e+01 | : 100%|███| 50/50 [00:59<00:00,  1.19s/it]

saving model version 0.1
Model: "sequential_136"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_589 (Dense)           (None, 32)                896       
                                                                 
 dense_590 (Dense)           (None, 29)                957       
                                                                 
 dense_591 (Dense)           (None, 5)                 150       
                                                                 
 dense_592 (Dense)           (None, 1)                 6         
                                                                 
Total params: 2,009
Trainable params: 2,009
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 3.40e+01 | : 100%|███| 50/50 [00:45<00:00,  1.10it/s]

saving model version 0.1
Model: "sequential_137"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_593 (Dense)           (None, 22)                616       
                                                                 
 dense_594 (Dense)           (None, 31)                713       
                                                                 
 dense_595 (Dense)           (None, 30)                960       
                                                                 
 dense_596 (Dense)           (None, 1)                 31        
                                                                 
Total params: 2,320
Trainable params: 2,320
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.76e+03 | test_loss: nan | reg: 5.87e+01 | : 100%|███| 50/50 [00:47<00:00,  1.05it/s]

saving model version 0.1
Model: "sequential_138"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_597 (Dense)           (None, 26)                728       
                                                                 
 dense_598 (Dense)           (None, 1)                 27        
                                                                 
Total params: 755
Trainable params: 755
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 6.07e+02 | : 100%|███| 50/50 [00:10<00:00,  4.74it/s]

saving model version 0.1
Model: "sequential_139"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_599 (Dense)           (None, 27)                756       
                                                                 
 dense_600 (Dense)           (None, 13)                364       
                                                                 





 dense_601 (Dense)           (None, 31)                434       
                                                                 
 dense_602 (Dense)           (None, 15)                480       
                                                                 
 dense_603 (Dense)           (None, 21)                336       
                                                                 
 dense_604 (Dense)           (None, 1)                 22        
                                                                 
Total params: 2,392
Trainable params: 2,392
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 1.59e+03 | : 100%|███| 50/50 [01:01<00:00,  1.22s/it]

saving model version 0.1
Model: "sequential_140"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_605 (Dense)           (None, 13)                364       
                                                                 
 dense_606 (Dense)           (None, 8)                 112       
                                                                 
 dense_607 (Dense)           (None, 1)                 9         
                                                                 
Total params: 485
Trainable params: 485
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 2.64e+01 | : 100%|███| 50/50 [00:26<00:00,  1.86it/s]


saving model version 0.1
Model: "sequential_141"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_608 (Dense)           (None, 11)                308       
                                                                 
 dense_609 (Dense)           (None, 31)                372       
                                                                 
 dense_610 (Dense)           (None, 25)                800       
                                                                 
 dense_611 (Dense)           (None, 22)                572       
                                                                 
 dense_612 (Dense)           (None, 1)                 23        
                                                                 
Total params: 2,075
Trainable params: 2,075
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/1

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.42e+03 | test_loss: nan | reg: 8.24e+01 | : 100%|███| 50/50 [01:13<00:00,  1.46s/it]

saving model version 0.1
Model: "sequential_142"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_613 (Dense)           (None, 14)                392       
                                                                 
 dense_614 (Dense)           (None, 32)                480       
                                                                 
 dense_615 (Dense)           (None, 36)                1188      
                                                                 
 dense_616 (Dense)           (None, 18)                666       
                                                                 
 dense_617 (Dense)           (None, 1)                 19        
                                                                 
Total params: 2,745
Trainable params: 2,745
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:01<00:00,  1.24s/it]

saving model version 0.1
ERROR ON SAMPLE 83
Model: "sequential_143"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_618 (Dense)           (None, 20)                560       
                                                                 
 dense_619 (Dense)           (None, 12)                252       
                                                                 
 dense_620 (Dense)           (None, 18)                234       
                                                                 
 dense_621 (Dense)           (None, 1)                 19        
                                                                 
Total params: 1,065
Trainable params: 1,065
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 6.85e+01 | : 100%|███| 50/50 [00:25<00:00,  1.96it/s]


saving model version 0.1
Model: "sequential_144"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_622 (Dense)           (None, 49)                1372      
                                                                 
 dense_623 (Dense)           (None, 12)                600       
                                                                 
 dense_624 (Dense)           (None, 7)                 91        
                                                                 
 dense_625 (Dense)           (None, 1)                 8         
                                                                 
Total params: 2,071
Trainable params: 2,071
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 3.71e+01 | : 100%|███| 50/50 [00:36<00:00,  1.37it/s]

saving model version 0.1
Model: "sequential_145"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_626 (Dense)           (None, 19)                532       
                                                                 
 dense_627 (Dense)           (None, 19)                380       
                                                                 
 dense_628 (Dense)           (None, 1)                 20        
                                                                 
Total params: 932
Trainable params: 932
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 3.39e+01 | : 100%|███| 50/50 [00:31<00:00,  1.60it/s]

saving model version 0.1
Model: "sequential_146"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_629 (Dense)           (None, 26)                728       
                                                                 
 dense_630 (Dense)           (None, 21)                567       
                                                                 
 dense_631 (Dense)           (None, 29)                638       
                                                                 
 dense_632 (Dense)           (None, 1)                 30        
                                                                 
Total params: 1,963
Trainable params: 1,963
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 5.02e+01 | : 100%|███| 50/50 [00:45<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_147"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_633 (Dense)           (None, 47)                1316      
                                                                 
 dense_634 (Dense)           (None, 26)                1248      
                                                                 
 dense_635 (Dense)           (None, 35)                945       
                                                                 
 dense_636 (Dense)           (None, 1)                 36        
                                                                 
Total params: 3,545
Trainable params: 3,545
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.13e+03 | test_loss: nan | reg: 4.72e+01 | : 100%|███| 50/50 [00:47<00:00,  1.04it/s]

saving model version 0.1
Model: "sequential_148"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_637 (Dense)           (None, 25)                700       
                                                                 
 dense_638 (Dense)           (None, 1)                 26        
                                                                 
Total params: 726
Trainable params: 726
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.04e+02 | : 100%|███| 50/50 [00:05<00:00,  9.20it/s]

saving model version 0.1
Model: "sequential_149"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_639 (Dense)           (None, 23)                644       
                                                                 
 dense_640 (Dense)           (None, 17)                408       
                                                                 
 dense_641 (Dense)           (None, 11)                198       
                                                                 
 dense_642 (Dense)           (None, 1)                 12        
                                                                 
Total params: 1,262
Trainable params: 1,262
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.85e+03 | test_loss: nan | reg: 9.80e+01 | : 100%|███| 50/50 [00:44<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_150"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_643 (Dense)           (None, 14)                392       
                                                                 
 dense_644 (Dense)           (None, 22)                330       
                                                                 
 dense_645 (Dense)           (None, 1)                 23        
                                                                 
Total params: 745
Trainable params: 745
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.32e+03 | test_loss: nan | reg: 3.64e+01 | : 100%|███| 50/50 [00:20<00:00,  2.48it/s]

saving model version 0.1
Model: "sequential_151"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_646 (Dense)           (None, 28)                784       
                                                                 
 dense_647 (Dense)           (None, 2)                 58        
                                                                 
 dense_648 (Dense)           (None, 3)                 9         
                                                                 
 dense_649 (Dense)           (None, 1)                 4         
                                                                 
Total params: 855
Trainable params: 855
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.49e+03 | test_loss: nan | reg: 7.42e+01 | : 100%|███| 50/50 [00:47<00:00,  1.05it/s]

saving model version 0.1
Model: "sequential_152"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_650 (Dense)           (None, 36)                1008      
                                                                 
 dense_651 (Dense)           (None, 30)                1110      
                                                                 
 dense_652 (Dense)           (None, 28)                868       
                                                                 
 dense_653 (Dense)           (None, 10)                290       
                                                                 
 dense_654 (Dense)           (None, 36)                396       
                                                                 
 dense_655 (Dense)           (None, 1)                 37        
                                                                 
Total params: 3,709
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 4, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 6.32e+01 | : 100%|███| 50/50 [01:31<00:00,  1.83s/it]

saving model version 0.1
Model: "sequential_153"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_656 (Dense)           (None, 40)                1120      
                                                                 
 dense_657 (Dense)           (None, 43)                1763      
                                                                 
 dense_658 (Dense)           (None, 15)                660       
                                                                 
 dense_659 (Dense)           (None, 25)                400       
                                                                 
 dense_660 (Dense)           (None, 1)                 26        
                                                                 
Total params: 3,969
Trainable params: 3,969
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.35e+03 | test_loss: nan | reg: 1.59e+02 | : 100%|███| 50/50 [00:39<00:00,  1.25it/s]

saving model version 0.1
Model: "sequential_154"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_661 (Dense)           (None, 19)                532       
                                                                 
 dense_662 (Dense)           (None, 31)                620       
                                                                 
 dense_663 (Dense)           (None, 1)                 32        
                                                                 
Total params: 1,184
Trainable params: 1,184
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 3.88e+01 | : 100%|███| 50/50 [00:16<00:00,  3.10it/s]

saving model version 0.1
Model: "sequential_155"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_664 (Dense)           (None, 25)                700       
                                                                 
 dense_665 (Dense)           (None, 29)                754       
                                                                 
 dense_666 (Dense)           (None, 16)                480       
                                                                 
 dense_667 (Dense)           (None, 1)                 17        
                                                                 
Total params: 1,951
Trainable params: 1,951
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 7.25e+01 | : 100%|███| 50/50 [00:48<00:00,  1.03it/s]

saving model version 0.1
Model: "sequential_156"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_668 (Dense)           (None, 21)                588       
                                                                 
 dense_669 (Dense)           (None, 1)                 22        
                                                                 
Total params: 610
Trainable params: 610
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.28e+03 | test_loss: nan | reg: 4.53e+02 | : 100%|███| 50/50 [00:08<00:00,  6.11it/s]

saving model version 0.1
Model: "sequential_157"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_670 (Dense)           (None, 41)                1148      
                                                                 
 dense_671 (Dense)           (None, 18)                756       
                                                                 
 dense_672 (Dense)           (None, 25)                475       
                                                                 
 dense_673 (Dense)           (None, 1)                 26        
                                                                 
Total params: 2,405
Trainable params: 2,405
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:41<00:00,  1.21it/s]

saving model version 0.1
ERROR ON SAMPLE 98
Model: "sequential_158"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_674 (Dense)           (None, 46)                1288      
                                                                 
 dense_675 (Dense)           (None, 38)                1786      
                                                                 
 dense_676 (Dense)           (None, 24)                936       
                                                                 
 dense_677 (Dense)           (None, 1)                 25        
                                                                 
Total params: 4,035
Trainable params: 4,035
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.20e+03 | test_loss: nan | reg: 3.41e+01 | : 100%|███| 50/50 [00:42<00:00,  1.18it/s]

saving model version 0.1
Model: "sequential_159"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_678 (Dense)           (None, 28)                784       
                                                                 
 dense_679 (Dense)           (None, 1)                 29        
                                                                 
Total params: 813
Trainable params: 813
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.03e+02 | : 100%|███| 50/50 [00:05<00:00,  8.54it/s]


saving model version 0.1
Model: "sequential_160"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_680 (Dense)           (None, 31)                868       
                                                                 
 dense_681 (Dense)           (None, 30)                960       
                                                                 
 dense_682 (Dense)           (None, 22)                682       
                                                                 
 dense_683 (Dense)           (None, 31)                713       
                                                                 
 dense_684 (Dense)           (None, 32)                1024      
                                                                 
 dense_685 (Dense)           (None, 19)                627       
                                                                 
 dense_686 (Dense)         

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:35<00:00,  1.91s/it]

saving model version 0.1
ERROR ON SAMPLE 101
Model: "sequential_161"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_687 (Dense)           (None, 34)                952       
                                                                 
 dense_688 (Dense)           (None, 16)                560       
                                                                 
 dense_689 (Dense)           (None, 28)                476       
                                                                 
 dense_690 (Dense)           (None, 16)                464       
                                                                 
 dense_691 (Dense)           (None, 3)                 51        
                                                                 
 dense_692 (Dense)           (None, 1)                 4         
                                                                 
Total p




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.71e+03 | test_loss: nan | reg: 1.22e+02 | : 100%|███| 50/50 [01:20<00:00,  1.60s/it]

saving model version 0.1
Model: "sequential_162"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_693 (Dense)           (None, 22)                616       
                                                                 
 dense_694 (Dense)           (None, 21)                483       
                                                                 
 dense_695 (Dense)           (None, 1)                 22        
                                                                 
Total params: 1,121
Trainable params: 1,121
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.31e+03 | test_loss: nan | reg: 1.00e+03 | : 100%|███| 50/50 [00:29<00:00,  1.69it/s]

saving model version 0.1
Model: "sequential_163"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_696 (Dense)           (None, 20)                560       
                                                                 
 dense_697 (Dense)           (None, 34)                714       
                                                                 
 dense_698 (Dense)           (None, 19)                665       
                                                                 
 dense_699 (Dense)           (None, 1)                 20        
                                                                 
Total params: 1,959
Trainable params: 1,959
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.87e+03 | test_loss: nan | reg: 9.48e+01 | : 100%|███| 50/50 [00:52<00:00,  1.04s/it]

saving model version 0.1
Model: "sequential_164"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_700 (Dense)           (None, 19)                532       
                                                                 
 dense_701 (Dense)           (None, 26)                520       
                                                                 
 dense_702 (Dense)           (None, 24)                648       
                                                                 
 dense_703 (Dense)           (None, 1)                 25        
                                                                 
Total params: 1,725
Trainable params: 1,725
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.55e+03 | test_loss: nan | reg: 6.61e+01 | : 100%|███| 50/50 [00:53<00:00,  1.07s/it]

saving model version 0.1
Model: "sequential_165"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_704 (Dense)           (None, 15)                420       
                                                                 
 dense_705 (Dense)           (None, 32)                512       
                                                                 
 dense_706 (Dense)           (None, 19)                627       
                                                                 
 dense_707 (Dense)           (None, 27)                540       
                                                                 
 dense_708 (Dense)           (None, 26)                728       
                                                                 
 dense_709 (Dense)           (None, 1)                 27        
                                                                 
Total params: 2,854
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 6, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:20<00:00,  1.61s/it]

saving model version 0.1
ERROR ON SAMPLE 106
Model: "sequential_166"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_710 (Dense)           (None, 18)                504       
                                                                 
 dense_711 (Dense)           (None, 28)                532       
                                                                 
 dense_712 (Dense)           (None, 21)                609       
                                                                 
 dense_713 (Dense)           (None, 1)                 22        
                                                                 
Total params: 1,667
Trainable params: 1,667
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.42e+03 | test_loss: nan | reg: 7.42e+02 | : 100%|███| 50/50 [00:30<00:00,  1.63it/s]

saving model version 0.1
Model: "sequential_167"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_714 (Dense)           (None, 27)                756       
                                                                 
 dense_715 (Dense)           (None, 36)                1008      
                                                                 
 dense_716 (Dense)           (None, 1)                 37        
                                                                 
Total params: 1,801
Trainable params: 1,801
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 3.83e+01 | : 100%|███| 50/50 [00:14<00:00,  3.37it/s]

saving model version 0.1
Model: "sequential_168"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_717 (Dense)           (None, 49)                1372      
                                                                 
 dense_718 (Dense)           (None, 31)                1550      
                                                                 
 dense_719 (Dense)           (None, 35)                1120      
                                                                 
 dense_720 (Dense)           (None, 1)                 36        
                                                                 
Total params: 4,078
Trainable params: 4,078
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.76e+03 | test_loss: nan | reg: 4.97e+01 | : 100%|███| 50/50 [00:53<00:00,  1.07s/it]

saving model version 0.1
Model: "sequential_169"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_721 (Dense)           (None, 17)                476       
                                                                 
 dense_722 (Dense)           (None, 10)                180       
                                                                 
 dense_723 (Dense)           (None, 36)                396       
                                                                 
 dense_724 (Dense)           (None, 1)                 37        
                                                                 
Total params: 1,089
Trainable params: 1,089
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.13e+03 | test_loss: nan | reg: 4.50e+01 | : 100%|███| 50/50 [00:48<00:00,  1.03it/s]

saving model version 0.1
Model: "sequential_170"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_725 (Dense)           (None, 29)                812       
                                                                 
 dense_726 (Dense)           (None, 21)                630       
                                                                 
 dense_727 (Dense)           (None, 1)                 22        
                                                                 
Total params: 1,464
Trainable params: 1,464
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.06e+03 | test_loss: nan | reg: 4.07e+01 | : 100%|███| 50/50 [00:32<00:00,  1.53it/s]

saving model version 0.1
Model: "sequential_171"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_728 (Dense)           (None, 12)                336       
                                                                 
 dense_729 (Dense)           (None, 30)                390       
                                                                 
 dense_730 (Dense)           (None, 31)                961       
                                                                 
 dense_731 (Dense)           (None, 22)                704       
                                                                 
 dense_732 (Dense)           (None, 1)                 23        
                                                                 
Total params: 2,414
Trainable params: 2,414
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 7.88e+01 | : 100%|███| 50/50 [00:55<00:00,  1.11s/it]

saving model version 0.1
Model: "sequential_172"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_733 (Dense)           (None, 34)                952       
                                                                 
 dense_734 (Dense)           (None, 15)                525       
                                                                 
 dense_735 (Dense)           (None, 37)                592       
                                                                 
 dense_736 (Dense)           (None, 1)                 38        
                                                                 
Total params: 2,107
Trainable params: 2,107
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.12e+03 | test_loss: nan | reg: 4.61e+01 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_173"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_737 (Dense)           (None, 33)                924       
                                                                 
 dense_738 (Dense)           (None, 38)                1292      
                                                                 
 dense_739 (Dense)           (None, 14)                546       
                                                                 
 dense_740 (Dense)           (None, 1)                 15        
                                                                 
Total params: 2,777
Trainable params: 2,777
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.39e+03 | test_loss: nan | reg: 7.46e+02 | : 100%|███| 50/50 [00:29<00:00,  1.71it/s]

saving model version 0.1
Model: "sequential_174"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_741 (Dense)           (None, 16)                448       
                                                                 
 dense_742 (Dense)           (None, 7)                 119       
                                                                 
 dense_743 (Dense)           (None, 31)                248       
                                                                 
 dense_744 (Dense)           (None, 37)                1184      
                                                                 
 dense_745 (Dense)           (None, 1)                 38        
                                                                 
Total params: 2,037
Trainable params: 2,037
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 6, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.90e+03 | test_loss: nan | reg: 8.16e+01 | : 100%|███| 50/50 [01:08<00:00,  1.36s/it]

saving model version 0.1
Model: "sequential_175"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_746 (Dense)           (None, 13)                364       
                                                                 
 dense_747 (Dense)           (None, 19)                266       
                                                                 
 dense_748 (Dense)           (None, 1)                 20        
                                                                 
Total params: 650
Trainable params: 650
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.75e+03 | test_loss: nan | reg: 6.42e+01 | : 100%|███| 50/50 [00:34<00:00,  1.43it/s]

saving model version 0.1
Model: "sequential_176"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_749 (Dense)           (None, 21)                588       
                                                                 
 dense_750 (Dense)           (None, 1)                 22        
                                                                 
Total params: 610
Trainable params: 610
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.00e+02 | : 100%|███| 50/50 [00:07<00:00,  6.29it/s]

saving model version 0.1
Model: "sequential_177"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_751 (Dense)           (None, 31)                868       
                                                                 
 dense_752 (Dense)           (None, 27)                864       
                                                                 
 dense_753 (Dense)           (None, 15)                420       
                                                                 
 dense_754 (Dense)           (None, 1)                 16        
                                                                 
Total params: 2,168
Trainable params: 2,168
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.77e+03 | test_loss: nan | reg: 7.60e+01 | : 100%|███| 50/50 [00:52<00:00,  1.04s/it]

saving model version 0.1
Model: "sequential_178"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_755 (Dense)           (None, 37)                1036      
                                                                 
 dense_756 (Dense)           (None, 17)                646       
                                                                 
 dense_757 (Dense)           (None, 27)                486       
                                                                 
 dense_758 (Dense)           (None, 1)                 28        
                                                                 
Total params: 2,196
Trainable params: 2,196
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.15e+03 | test_loss: nan | reg: 4.19e+01 | : 100%|███| 50/50 [00:43<00:00,  1.14it/s]


saving model version 0.1
Model: "sequential_179"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_759 (Dense)           (None, 45)                1260      
                                                                 
 dense_760 (Dense)           (None, 48)                2208      
                                                                 
 dense_761 (Dense)           (None, 24)                1176      
                                                                 
 dense_762 (Dense)           (None, 1)                 25        
                                                                 
Total params: 4,669
Trainable params: 4,669
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.71e+03 | test_loss: nan | reg: 7.08e+01 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_180"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_763 (Dense)           (None, 22)                616       
                                                                 
 dense_764 (Dense)           (None, 21)                483       
                                                                 
 dense_765 (Dense)           (None, 37)                814       
                                                                 
 dense_766 (Dense)           (None, 1)                 38        
                                                                 
Total params: 1,951
Trainable params: 1,951
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.06e+03 | test_loss: nan | reg: 8.26e+01 | : 100%|███| 50/50 [00:54<00:00,  1.09s/it]

saving model version 0.1
Model: "sequential_181"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_767 (Dense)           (None, 17)                476       
                                                                 
 dense_768 (Dense)           (None, 8)                 144       
                                                                 
 dense_769 (Dense)           (None, 11)                99        
                                                                 
 dense_770 (Dense)           (None, 1)                 12        
                                                                 
Total params: 731
Trainable params: 731
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.91e+03 | test_loss: nan | reg: 6.30e+01 | : 100%|███| 50/50 [00:54<00:00,  1.08s/it]

saving model version 0.1
Model: "sequential_182"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_771 (Dense)           (None, 35)                980       
                                                                 
 dense_772 (Dense)           (None, 10)                360       
                                                                 
 dense_773 (Dense)           (None, 1)                 11        
                                                                 
Total params: 1,351
Trainable params: 1,351
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.35e+03 | test_loss: nan | reg: 8.15e+02 | : 100%|███| 50/50 [00:28<00:00,  1.78it/s]


saving model version 0.1
Model: "sequential_183"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_774 (Dense)           (None, 20)                560       
                                                                 
 dense_775 (Dense)           (None, 48)                1008      
                                                                 
 dense_776 (Dense)           (None, 18)                882       
                                                                 
 dense_777 (Dense)           (None, 1)                 19        
                                                                 
Total params: 2,469
Trainable params: 2,469
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 5.38e+01 | : 100%|███| 50/50 [00:38<00:00,  1.30it/s]

saving model version 0.1
Model: "sequential_184"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_778 (Dense)           (None, 25)                700       
                                                                 
 dense_779 (Dense)           (None, 28)                728       
                                                                 
 dense_780 (Dense)           (None, 1)                 29        
                                                                 
Total params: 1,457
Trainable params: 1,457
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.91e+03 | test_loss: nan | reg: 5.38e+01 | : 100%|███| 50/50 [00:31<00:00,  1.59it/s]

saving model version 0.1
Model: "sequential_185"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_781 (Dense)           (None, 39)                1092      
                                                                 
 dense_782 (Dense)           (None, 26)                1040      
                                                                 
 dense_783 (Dense)           (None, 1)                 27        
                                                                 
Total params: 2,159
Trainable params: 2,159
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.86e+03 | test_loss: nan | reg: 4.26e+01 | : 100%|███| 50/50 [00:26<00:00,  1.91it/s]

saving model version 0.1
Model: "sequential_186"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_784 (Dense)           (None, 25)                700       
                                                                 
 dense_785 (Dense)           (None, 19)                494       
                                                                 
 dense_786 (Dense)           (None, 1)                 20        
                                                                 
Total params: 1,214
Trainable params: 1,214
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.24e+03 | test_loss: nan | reg: 6.13e+01 | : 100%|███| 50/50 [00:30<00:00,  1.65it/s]

saving model version 0.1
Model: "sequential_187"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_787 (Dense)           (None, 31)                868       
                                                                 
 dense_788 (Dense)           (None, 12)                384       
                                                                 
 dense_789 (Dense)           (None, 38)                494       
                                                                 
 dense_790 (Dense)           (None, 1)                 39        
                                                                 
Total params: 1,785
Trainable params: 1,785
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.15e+03 | test_loss: nan | reg: 4.02e+01 | : 100%|███| 50/50 [00:38<00:00,  1.31it/s]

saving model version 0.1
Model: "sequential_188"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_791 (Dense)           (None, 30)                840       
                                                                 
 dense_792 (Dense)           (None, 1)                 31        
                                                                 
Total params: 871
Trainable params: 871
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:08<00:00,  5.94it/s]

saving model version 0.1
Model: "sequential_189"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_793 (Dense)           (None, 17)                476       
                                                                 
 dense_794 (Dense)           (None, 27)                486       
                                                                 
 dense_795 (Dense)           (None, 25)                700       
                                                                 
 dense_796 (Dense)           (None, 1)                 26        
                                                                 
Total params: 1,688
Trainable params: 1,688
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.15e+03 | test_loss: nan | reg: 4.71e+01 | : 100%|███| 50/50 [00:48<00:00,  1.02it/s]

saving model version 0.1
Model: "sequential_190"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_797 (Dense)           (None, 27)                756       
                                                                 
 dense_798 (Dense)           (None, 12)                336       
                                                                 
 dense_799 (Dense)           (None, 29)                377       
                                                                 
 dense_800 (Dense)           (None, 1)                 30        
                                                                 
Total params: 1,499
Trainable params: 1,499
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.89e+03 | test_loss: nan | reg: 3.79e+01 | : 100%|███| 50/50 [00:32<00:00,  1.52it/s]


saving model version 0.1
Model: "sequential_191"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_801 (Dense)           (None, 38)                1064      
                                                                 
 dense_802 (Dense)           (None, 31)                1209      
                                                                 
 dense_803 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,305
Trainable params: 2,305
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 2.94e+01 | : 100%|███| 50/50 [00:32<00:00,  1.52it/s]

saving model version 0.1
Model: "sequential_192"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_804 (Dense)           (None, 23)                644       
                                                                 
 dense_805 (Dense)           (None, 21)                504       
                                                                 
 dense_806 (Dense)           (None, 1)                 22        
                                                                 
Total params: 1,170
Trainable params: 1,170
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 8.13e+01 | : 100%|███| 50/50 [00:12<00:00,  3.91it/s]

saving model version 0.1
Model: "sequential_193"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_807 (Dense)           (None, 38)                1064      
                                                                 
 dense_808 (Dense)           (None, 28)                1092      
                                                                 
 dense_809 (Dense)           (None, 28)                812       
                                                                 
 dense_810 (Dense)           (None, 1)                 29        
                                                                 
Total params: 2,997
Trainable params: 2,997
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.34e+03 | test_loss: nan | reg: 8.31e+01 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_194"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_811 (Dense)           (None, 37)                1036      
                                                                 
 dense_812 (Dense)           (None, 22)                836       
                                                                 
 dense_813 (Dense)           (None, 1)                 23        
                                                                 
Total params: 1,895
Trainable params: 1,895
Non-trainable params: 0





_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 4.16e+02 | : 100%|███| 50/50 [00:19<00:00,  2.61it/s]

saving model version 0.1
Model: "sequential_195"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_814 (Dense)           (None, 23)                644       
                                                                 
 dense_815 (Dense)           (None, 21)                504       
                                                                 
 dense_816 (Dense)           (None, 12)                264       
                                                                 
 dense_817 (Dense)           (None, 1)                 13        
                                                                 
Total params: 1,425
Trainable params: 1,425
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 3.31e+01 | : 100%|███| 50/50 [00:26<00:00,  1.89it/s]

saving model version 0.1
Model: "sequential_196"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_818 (Dense)           (None, 36)                1008      
                                                                 
 dense_819 (Dense)           (None, 18)                666       
                                                                 
 dense_820 (Dense)           (None, 35)                665       
                                                                 
 dense_821 (Dense)           (None, 35)                1260      





                                                                 
 dense_822 (Dense)           (None, 1)                 36        
                                                                 
Total params: 3,635
Trainable params: 3,635
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 4.40e+01 | : 100%|███| 50/50 [00:54<00:00,  1.09s/it]

saving model version 0.1
Model: "sequential_197"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_823 (Dense)           (None, 35)                980       
                                                                 
 dense_824 (Dense)           (None, 24)                864       
                                                                 
 dense_825 (Dense)           (None, 20)                500       
                                                                 
 dense_826 (Dense)           (None, 33)                693       
                                                                 
 dense_827 (Dense)           (None, 1)                 34        
                                                                 
Total params: 3,071
Trainable params: 3,071
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.59e+03 | test_loss: nan | reg: 2.56e+02 | : 100%|███| 50/50 [00:27<00:00,  1.81it/s]

saving model version 0.1
Model: "sequential_198"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_828 (Dense)           (None, 24)                672       
                                                                 
 dense_829 (Dense)           (None, 22)                550       
                                                                 
 dense_830 (Dense)           (None, 17)                391       
                                                                 
 dense_831 (Dense)           (None, 23)                414       
                                                                 
 dense_832 (Dense)           (None, 17)                408       
                                                                 
 dense_833 (Dense)           (None, 1)                 18        
                                                                 
Total params: 2,453
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:24<00:00,  1.69s/it]

saving model version 0.1
ERROR ON SAMPLE 139
Model: "sequential_199"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_834 (Dense)           (None, 28)                784       
                                                                 
 dense_835 (Dense)           (None, 17)                493       
                                                                 
 dense_836 (Dense)           (None, 35)                630       
                                                                 
 dense_837 (Dense)           (None, 1)                 36        
                                                                 
Total params: 1,943
Trainable params: 1,943
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.32e+03 | test_loss: nan | reg: 4.50e+01 | : 100%|███| 50/50 [00:26<00:00,  1.91it/s]

saving model version 0.1
Model: "sequential_200"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_838 (Dense)           (None, 33)                924       
                                                                 
 dense_839 (Dense)           (None, 20)                680       
                                                                 





 dense_840 (Dense)           (None, 30)                630       
                                                                 
 dense_841 (Dense)           (None, 1)                 31        
                                                                 
Total params: 2,265
Trainable params: 2,265
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.65e+03 | test_loss: nan | reg: 5.64e+02 | : 100%|███| 50/50 [00:24<00:00,  2.06it/s]

saving model version 0.1
Model: "sequential_201"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_842 (Dense)           (None, 34)                952       
                                                                 
 dense_843 (Dense)           (None, 30)                1050      
                                                                 
 dense_844 (Dense)           (None, 22)                682       
                                                                 
 dense_845 (Dense)           (None, 1)                 23        
                                                                 
Total params: 2,707
Trainable params: 2,707
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.20e+03 | test_loss: nan | reg: 5.02e+01 | : 100%|███| 50/50 [00:42<00:00,  1.19it/s]

saving model version 0.1
Model: "sequential_202"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_846 (Dense)           (None, 37)                1036      
                                                                 
 dense_847 (Dense)           (None, 15)                570       
                                                                 
 dense_848 (Dense)           (None, 1)                 16        
                                                                 
Total params: 1,622
Trainable params: 1,622
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.91e+03 | test_loss: nan | reg: 6.91e+01 | : 100%|███| 50/50 [00:41<00:00,  1.21it/s]

saving model version 0.1
Model: "sequential_203"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_849 (Dense)           (None, 24)                672       
                                                                 
 dense_850 (Dense)           (None, 44)                1100      
                                                                 
 dense_851 (Dense)           (None, 1)                 45        
                                                                 
Total params: 1,817
Trainable params: 1,817
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.08e+03 | test_loss: nan | reg: 3.82e+01 | : 100%|███| 50/50 [00:35<00:00,  1.39it/s]

saving model version 0.1
Model: "sequential_204"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_852 (Dense)           (None, 26)                728       
                                                                 
 dense_853 (Dense)           (None, 32)                864       
                                                                 
 dense_854 (Dense)           (None, 1)                 33        
                                                                 
Total params: 1,625
Trainable params: 1,625
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.18e+03 | test_loss: nan | reg: 2.89e+02 | : 100%|███| 50/50 [00:18<00:00,  2.71it/s]

saving model version 0.1
Model: "sequential_205"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_855 (Dense)           (None, 25)                700       
                                                                 
 dense_856 (Dense)           (None, 16)                416       
                                                                 
 dense_857 (Dense)           (None, 22)                374       
                                                                 
 dense_858 (Dense)           (None, 32)                736       
                                                                 
 dense_859 (Dense)           (None, 27)                891       
                                                                 
 dense_860 (Dense)           (None, 1)                 28        
                                                                 
Total params: 3,145
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 2, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.68e+03 | test_loss: nan | reg: 6.36e+01 | : 100%|███| 50/50 [01:18<00:00,  1.58s/it]

saving model version 0.1
Model: "sequential_206"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_861 (Dense)           (None, 11)                308       
                                                                 
 dense_862 (Dense)           (None, 23)                276       
                                                                 
 dense_863 (Dense)           (None, 19)                456       
                                                                 
 dense_864 (Dense)           (None, 34)                680       
                                                                 
 dense_865 (Dense)           (None, 1)                 35        
                                                                 
Total params: 1,755
Trainable params: 1,755
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 7, 6, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.03e+03 | test_loss: nan | reg: 9.24e+01 | : 100%|███| 50/50 [01:18<00:00,  1.56s/it]

saving model version 0.1
Model: "sequential_207"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_866 (Dense)           (None, 27)                756       
                                                                 
 dense_867 (Dense)           (None, 38)                1064      
                                                                 
 dense_868 (Dense)           (None, 1)                 39        
                                                                 
Total params: 1,859
Trainable params: 1,859
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 7.80e+01 | : 100%|███| 50/50 [00:16<00:00,  3.00it/s]

saving model version 0.1
Model: "sequential_208"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_869 (Dense)           (None, 26)                728       
                                                                 
 dense_870 (Dense)           (None, 12)                324       
                                                                 
 dense_871 (Dense)           (None, 27)                351       
                                                                 
 dense_872 (Dense)           (None, 1)                 28        
                                                                 
Total params: 1,431
Trainable params: 1,431
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 5.91e+04 | : 100%|███| 50/50 [00:35<00:00,  1.41it/s]

saving model version 0.1
Model: "sequential_209"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_873 (Dense)           (None, 29)                812       





                                                                 
 dense_874 (Dense)           (None, 31)                930       
                                                                 
 dense_875 (Dense)           (None, 44)                1408      
                                                                 
 dense_876 (Dense)           (None, 1)                 45        
                                                                 
Total params: 3,195
Trainable params: 3,195
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.62e+03 | test_loss: nan | reg: 5.79e+01 | : 100%|███| 50/50 [00:45<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_210"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_877 (Dense)           (None, 30)                840       
                                                                 
 dense_878 (Dense)           (None, 19)                589       
                                                                 
 dense_879 (Dense)           (None, 1)                 20        
                                                                 
Total params: 1,449
Trainable params: 1,449
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.66e+03 | test_loss: nan | reg: 5.85e+01 | : 100%|███| 50/50 [00:37<00:00,  1.34it/s]

saving model version 0.1
Model: "sequential_211"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_880 (Dense)           (None, 23)                644       
                                                                 
 dense_881 (Dense)           (None, 8)                 192       
                                                                 
 dense_882 (Dense)           (None, 20)                180       
                                                                 
 dense_883 (Dense)           (None, 1)                 21        
                                                                 
Total params: 1,037
Trainable params: 1,037
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.31e+03 | test_loss: nan | reg: 5.87e+02 | : 100%|███| 50/50 [00:34<00:00,  1.45it/s]

saving model version 0.1
Model: "sequential_212"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_884 (Dense)           (None, 13)                364       
                                                                 
 dense_885 (Dense)           (None, 25)                350       
                                                                 
 dense_886 (Dense)           (None, 25)                650       
                                                                 
 dense_887 (Dense)           (None, 1)                 26        
                                                                 
Total params: 1,390
Trainable params: 1,390
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.10e+03 | test_loss: nan | reg: 8.96e+01 | : 100%|███| 50/50 [00:47<00:00,  1.06it/s]

saving model version 0.1
Model: "sequential_213"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_888 (Dense)           (None, 26)                728       
                                                                 
 dense_889 (Dense)           (None, 27)                729       
                                                                 
 dense_890 (Dense)           (None, 41)                1148      
                                                                 
 dense_891 (Dense)           (None, 36)                1512      
                                                                 
 dense_892 (Dense)           (None, 22)                814       
                                                                 
 dense_893 (Dense)           (None, 1)                 23        
                                                                 
Total params: 4,954
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.21e+03 | test_loss: nan | reg: 8.04e+01 | : 100%|███| 50/50 [01:02<00:00,  1.26s/it]

saving model version 0.1
Model: "sequential_214"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_894 (Dense)           (None, 27)                756       
                                                                 
 dense_895 (Dense)           (None, 14)                392       
                                                                 
 dense_896 (Dense)           (None, 9)                 135       
                                                                 
 dense_897 (Dense)           (None, 1)                 10        
                                                                 
 dense_898 (Dense)           (None, 1)                 2         
                                                                 
Total params: 1,295
Trainable params: 1,295
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.50e+02 | : 100%|███| 50/50 [00:34<00:00,  1.45it/s]


saving model version 0.1
Model: "sequential_215"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_899 (Dense)           (None, 7)                 196       
                                                                 
 dense_900 (Dense)           (None, 19)                152       
                                                                 
 dense_901 (Dense)           (None, 24)                480       
                                                                 
 dense_902 (Dense)           (None, 31)                775       
                                                                 
 dense_903 (Dense)           (None, 1)                 32        
                                                                 
Total params: 1,635
Trainable params: 1,635
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/1

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.87e+03 | test_loss: nan | reg: 5.36e+01 | : 100%|███| 50/50 [01:00<00:00,  1.20s/it]

saving model version 0.1
Model: "sequential_216"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_904 (Dense)           (None, 38)                1064      
                                                                 
 dense_905 (Dense)           (None, 16)                624       
                                                                 
 dense_906 (Dense)           (None, 39)                663       
                                                                 
 dense_907 (Dense)           (None, 1)                 40        
                                                                 
Total params: 2,391
Trainable params: 2,391
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.72e+03 | test_loss: nan | reg: 4.63e+01 | : 100%|███| 50/50 [00:44<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_217"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_908 (Dense)           (None, 47)                1316      
                                                                 
 dense_909 (Dense)           (None, 31)                1488      
                                                                 
 dense_910 (Dense)           (None, 35)                1120      
                                                                 
 dense_911 (Dense)           (None, 32)                1152      
                                                                 
 dense_912 (Dense)           (None, 1)                 33        
                                                                 
Total params: 5,109
Trainable params: 5,109
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.07e+03 | test_loss: nan | reg: 8.69e+01 | : 100%|███| 50/50 [01:03<00:00,  1.28s/it]

saving model version 0.1
Model: "sequential_218"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_913 (Dense)           (None, 31)                868       
                                                                 
 dense_914 (Dense)           (None, 13)                416       
                                                                 
 dense_915 (Dense)           (None, 1)                 14        
                                                                 
Total params: 1,298
Trainable params: 1,298
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.10e+03 | test_loss: nan | reg: 4.31e+01 | : 100%|███| 50/50 [00:30<00:00,  1.65it/s]

saving model version 0.1
Model: "sequential_219"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_916 (Dense)           (None, 34)                952       
                                                                 
 dense_917 (Dense)           (None, 16)                560       
                                                                 
 dense_918 (Dense)           (None, 31)                527       
                                                                 
 dense_919 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,071
Trainable params: 2,071
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 2.12e+02 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_220"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_920 (Dense)           (None, 30)                840       
                                                                 
 dense_921 (Dense)           (None, 23)                713       
                                                                 
 dense_922 (Dense)           (None, 12)                288       
                                                                 
 dense_923 (Dense)           (None, 1)                 13        
                                                                 
Total params: 1,854
Trainable params: 1,854
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 1.52e+02 | : 100%|███| 50/50 [00:38<00:00,  1.30it/s]

saving model version 0.1
Model: "sequential_221"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_924 (Dense)           (None, 17)                476       
                                                                 
 dense_925 (Dense)           (None, 32)                576       
                                                                 
 dense_926 (Dense)           (None, 26)                858       
                                                                 
 dense_927 (Dense)           (None, 35)                945       
                                                                 
 dense_928 (Dense)           (None, 1)                 36        
                                                                 
Total params: 2,891
Trainable params: 2,891
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.31e+03 | test_loss: nan | reg: 2.00e+02 | : 100%|███| 50/50 [00:45<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_222"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_929 (Dense)           (None, 44)                1232      
                                                                 
 dense_930 (Dense)           (None, 21)                945       
                                                                 
 dense_931 (Dense)           (None, 39)                858       
                                                                 
 dense_932 (Dense)           (None, 1)                 40        
                                                                 
Total params: 3,075
Trainable params: 3,075
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 5.17e+01 | : 100%|███| 50/50 [00:35<00:00,  1.40it/s]

saving model version 0.1
Model: "sequential_223"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_933 (Dense)           (None, 15)                420       
                                                                 
 dense_934 (Dense)           (None, 19)                304       
                                                                 
 dense_935 (Dense)           (None, 1)                 20        
                                                                 
Total params: 744
Trainable params: 744
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.20e+03 | test_loss: nan | reg: 4.25e+01 | : 100%|███| 50/50 [00:37<00:00,  1.35it/s]

saving model version 0.1
Model: "sequential_224"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_936 (Dense)           (None, 36)                1008      
                                                                 
 dense_937 (Dense)           (None, 30)                1110      
                                                                 
 dense_938 (Dense)           (None, 32)                992       
                                                                 
 dense_939 (Dense)           (None, 1)                 33        
                                                                 
Total params: 3,143
Trainable params: 3,143
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 6.04e+01 | : 100%|███| 50/50 [00:41<00:00,  1.20it/s]

saving model version 0.1
Model: "sequential_225"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_940 (Dense)           (None, 20)                560       
                                                                 
 dense_941 (Dense)           (None, 39)                819       
                                                                 
 dense_942 (Dense)           (None, 33)                1320      
                                                                 
 dense_943 (Dense)           (None, 24)                816       
                                                                 
 dense_944 (Dense)           (None, 1)                 25        
                                                                 
Total params: 3,540
Trainable params: 3,540
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 2, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.96e+03 | test_loss: nan | reg: 7.78e+01 | : 100%|███| 50/50 [01:02<00:00,  1.25s/it]

saving model version 0.1
Model: "sequential_226"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_945 (Dense)           (None, 16)                448       
                                                                 
 dense_946 (Dense)           (None, 25)                425       
                                                                 
 dense_947 (Dense)           (None, 1)                 26        
                                                                 
Total params: 899
Trainable params: 899
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 4.35e+01 | : 100%|███| 50/50 [00:31<00:00,  1.58it/s]

saving model version 0.1
Model: "sequential_227"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_948 (Dense)           (None, 50)                1400      
                                                                 
 dense_949 (Dense)           (None, 13)                663       
                                                                 
 dense_950 (Dense)           (None, 35)                490       
                                                                 
 dense_951 (Dense)           (None, 42)                1512      
                                                                 
 dense_952 (Dense)           (None, 1)                 43        
                                                                 
Total params: 4,108
Trainable params: 4,108
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.13e+03 | test_loss: nan | reg: 4.87e+01 | : 100%|███| 50/50 [01:05<00:00,  1.30s/it]

saving model version 0.1
Model: "sequential_228"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_953 (Dense)           (None, 28)                784       
                                                                 
 dense_954 (Dense)           (None, 27)                783       
                                                                 
 dense_955 (Dense)           (None, 25)                700       
                                                                 
 dense_956 (Dense)           (None, 18)                468       
                                                                 
 dense_957 (Dense)           (None, 1)                 19        
                                                                 
Total params: 2,754
Trainable params: 2,754
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 6, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 5.21e+01 | : 100%|███| 50/50 [00:49<00:00,  1.01it/s]


saving model version 0.1
Model: "sequential_229"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_958 (Dense)           (None, 7)                 196       
                                                                 
 dense_959 (Dense)           (None, 50)                400       
                                                                 
 dense_960 (Dense)           (None, 32)                1632      
                                                                 
 dense_961 (Dense)           (None, 1)                 33        
                                                                 
Total params: 2,261
Trainable params: 2,261
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.23e+03 | test_loss: nan | reg: 4.98e+01 | : 100%|███| 50/50 [00:48<00:00,  1.02it/s]

saving model version 0.1
Model: "sequential_230"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_962 (Dense)           (None, 28)                784       
                                                                 
 dense_963 (Dense)           (None, 28)                812       
                                                                 
 dense_964 (Dense)           (None, 20)                580       
                                                                 
 dense_965 (Dense)           (None, 37)                777       
                                                                 
 dense_966 (Dense)           (None, 1)                 38        
                                                                 
Total params: 2,991
Trainable params: 2,991
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 6, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 6.16e+01 | : 100%|███| 50/50 [01:06<00:00,  1.33s/it]

saving model version 0.1
Model: "sequential_231"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_967 (Dense)           (None, 13)                364       
                                                                 
 dense_968 (Dense)           (None, 28)                392       
                                                                 
 dense_969 (Dense)           (None, 13)                377       
                                                                 
 dense_970 (Dense)           (None, 9)                 126       
                                                                 
 dense_971 (Dense)           (None, 1)                 10        
                                                                 
Total params: 1,269
Trainable params: 1,269
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 6.09e+01 | : 100%|███| 50/50 [00:35<00:00,  1.42it/s]

saving model version 0.1
Model: "sequential_232"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_972 (Dense)           (None, 20)                560       
                                                                 
 dense_973 (Dense)           (None, 32)                672       
                                                                 
 dense_974 (Dense)           (None, 31)                1023      
                                                                 
 dense_975 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,287
Trainable params: 2,287
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 4.78e+01 | : 100%|███| 50/50 [00:50<00:00,  1.00s/it]

saving model version 0.1
Model: "sequential_233"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_976 (Dense)           (None, 24)                672       
                                                                 
 dense_977 (Dense)           (None, 19)                475       
                                                                 
 dense_978 (Dense)           (None, 25)                500       
                                                                 
 dense_979 (Dense)           (None, 31)                806       
                                                                 
 dense_980 (Dense)           (None, 1)                 32        
                                                                 
Total params: 2,485
Trainable params: 2,485
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 2.69e+02 | : 100%|███| 50/50 [00:38<00:00,  1.30it/s]

saving model version 0.1
Model: "sequential_234"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_981 (Dense)           (None, 33)                924       
                                                                 
 dense_982 (Dense)           (None, 34)                1156      
                                                                 
 dense_983 (Dense)           (None, 1)                 35        
                                                                 
Total params: 2,115
Trainable params: 2,115
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.12e+03 | test_loss: nan | reg: 8.88e+02 | : 100%|███| 50/50 [00:33<00:00,  1.51it/s]

saving model version 0.1
Model: "sequential_235"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_984 (Dense)           (None, 19)                532       
                                                                 
 dense_985 (Dense)           (None, 19)                380       
                                                                 
 dense_986 (Dense)           (None, 1)                 20        
                                                                 
Total params: 932
Trainable params: 932
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.17e+03 | test_loss: nan | reg: 7.19e+01 | : 100%|███| 50/50 [00:33<00:00,  1.51it/s]

saving model version 0.1
Model: "sequential_236"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_987 (Dense)           (None, 25)                700       
                                                                 
 dense_988 (Dense)           (None, 23)                598       
                                                                 
 dense_989 (Dense)           (None, 11)                264       
                                                                 
 dense_990 (Dense)           (None, 29)                348       
                                                                 
 dense_991 (Dense)           (None, 1)                 30        
                                                                 
Total params: 1,940
Trainable params: 1,940
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 2, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.23e+03 | test_loss: nan | reg: 6.79e+01 | : 100%|███| 50/50 [01:05<00:00,  1.31s/it]

saving model version 0.1
Model: "sequential_237"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_992 (Dense)           (None, 25)                700       
                                                                 
 dense_993 (Dense)           (None, 34)                884       
                                                                 
 dense_994 (Dense)           (None, 1)                 35        
                                                                 
Total params: 1,619
Trainable params: 1,619
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 3.50e+01 | : 100%|███| 50/50 [00:36<00:00,  1.39it/s]

saving model version 0.1
Model: "sequential_238"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_995 (Dense)           (None, 26)                728       
                                                                 
 dense_996 (Dense)           (None, 29)                783       
                                                                 
 dense_997 (Dense)           (None, 9)                 270       
                                                                 
 dense_998 (Dense)           (None, 1)                 10        
                                                                 
Total params: 1,791
Trainable params: 1,791
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 5.52e+01 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_239"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_999 (Dense)           (None, 26)                728       
                                                                 
 dense_1000 (Dense)          (None, 33)                891       
                                                                 
 dense_1001 (Dense)          (None, 1)                 34        
                                                                 
Total params: 1,653
Trainable params: 1,653
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.20e+03 | test_loss: nan | reg: 3.36e+01 | : 100%|███| 50/50 [00:29<00:00,  1.69it/s]

saving model version 0.1
Model: "sequential_240"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1002 (Dense)          (None, 26)                728       
                                                                 
 dense_1003 (Dense)          (None, 39)                1053      
                                                                 
 dense_1004 (Dense)          (None, 1)                 40        
                                                                 
Total params: 1,821
Trainable params: 1,821
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.87e+03 | test_loss: nan | reg: 4.61e+01 | : 100%|███| 50/50 [00:28<00:00,  1.76it/s]


saving model version 0.1
Model: "sequential_241"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1005 (Dense)          (None, 22)                616       
                                                                 
 dense_1006 (Dense)          (None, 36)                828       
                                                                 
 dense_1007 (Dense)          (None, 31)                1147      
                                                                 
 dense_1008 (Dense)          (None, 1)                 32        
                                                                 
Total params: 2,623
Trainable params: 2,623
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.99e+03 | test_loss: nan | reg: 5.13e+01 | : 100%|███| 50/50 [00:52<00:00,  1.05s/it]

saving model version 0.1
Model: "sequential_242"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1009 (Dense)          (None, 35)                980       
                                                                 
 dense_1010 (Dense)          (None, 14)                504       
                                                                 
 dense_1011 (Dense)          (None, 14)                210       
                                                                 
 dense_1012 (Dense)          (None, 1)                 15        
                                                                 
Total params: 1,709
Trainable params: 1,709
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.85e+03 | test_loss: nan | reg: 1.23e+02 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_243"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1013 (Dense)          (None, 17)                476       
                                                                 
 dense_1014 (Dense)          (None, 23)                414       
                                                                 
 dense_1015 (Dense)          (None, 43)                1032      
                                                                 
 dense_1016 (Dense)          (None, 1)                 44        
                                                                 
Total params: 1,966
Trainable params: 1,966
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.48e+03 | test_loss: nan | reg: 7.45e+01 | : 100%|███| 50/50 [00:52<00:00,  1.05s/it]

saving model version 0.1
Model: "sequential_244"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1017 (Dense)          (None, 14)                392       
                                                                 
 dense_1018 (Dense)          (None, 14)                210       
                                                                 
 dense_1019 (Dense)          (None, 18)                270       
                                                                 
 dense_1020 (Dense)          (None, 1)                 19        
                                                                 
Total params: 891
Trainable params: 891
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 4.37e+01 | : 100%|███| 50/50 [00:24<00:00,  2.06it/s]


saving model version 0.1
Model: "sequential_245"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1021 (Dense)          (None, 30)                840       
                                                                 
 dense_1022 (Dense)          (None, 26)                806       
                                                                 
 dense_1023 (Dense)          (None, 39)                1053      
                                                                 
 dense_1024 (Dense)          (None, 17)                680       
                                                                 
 dense_1025 (Dense)          (None, 26)                468       
                                                                 
 dense_1026 (Dense)          (None, 1)                 27        
                                                                 
Total params: 3,874
Trainab

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 6.89e+01 | : 100%|███| 50/50 [00:39<00:00,  1.25it/s]

saving model version 0.1
Model: "sequential_246"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1027 (Dense)          (None, 3)                 84        
                                                                 
 dense_1028 (Dense)          (None, 21)                84        
                                                                 
 dense_1029 (Dense)          (None, 31)                682       
                                                                 
 dense_1030 (Dense)          (None, 24)                768       
                                                                 
 dense_1031 (Dense)          (None, 1)                 25        
                                                                 
Total params: 1,643
Trainable params: 1,643
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:12<00:00,  1.44s/it]

saving model version 0.1
ERROR ON SAMPLE 187
Model: "sequential_247"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1032 (Dense)          (None, 26)                728       
                                                                 
 dense_1033 (Dense)          (None, 30)                810       
                                                                 
 dense_1034 (Dense)          (None, 35)                1085      
                                                                 
 dense_1035 (Dense)          (None, 12)                432       
                                                                 
 dense_1036 (Dense)          (None, 1)                 13        
                                                                 
Total params: 3,068
Trainable params: 3,068
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.90e+02 | : 100%|███| 50/50 [00:26<00:00,  1.91it/s]

saving model version 0.1
Model: "sequential_248"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1037 (Dense)          (None, 13)                364       
                                                                 
 dense_1038 (Dense)          (None, 1)                 14        
                                                                 
Total params: 378
Trainable params: 378
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 1.35e+02 | : 100%|███| 50/50 [00:10<00:00,  4.76it/s]

saving model version 0.1
Model: "sequential_249"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1039 (Dense)          (None, 39)                1092      
                                                                 
 dense_1040 (Dense)          (None, 35)                1400      
                                                                 
 dense_1041 (Dense)          (None, 28)                1008      
                                                                 
 dense_1042 (Dense)          (None, 25)                725       
                                                                 
 dense_1043 (Dense)          (None, 1)                 26        
                                                                 
Total params: 4,251
Trainable params: 4,251
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.64e+03 | test_loss: nan | reg: 5.80e+01 | : 100%|███| 50/50 [01:02<00:00,  1.26s/it]

saving model version 0.1
Model: "sequential_250"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1044 (Dense)          (None, 28)                784       
                                                                 
 dense_1045 (Dense)          (None, 1)                 29        
                                                                 
Total params: 813
Trainable params: 813
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:06<00:00,  7.24it/s]


saving model version 0.1
Model: "sequential_251"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1046 (Dense)          (None, 38)                1064      
                                                                 
 dense_1047 (Dense)          (None, 24)                936       
                                                                 
 dense_1048 (Dense)          (None, 1)                 25        
                                                                 
Total params: 2,025
Trainable params: 2,025
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.58e+03 | test_loss: nan | reg: 8.25e+02 | : 100%|███| 50/50 [00:33<00:00,  1.50it/s]

saving model version 0.1
Model: "sequential_252"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1049 (Dense)          (None, 15)                420       
                                                                 
 dense_1050 (Dense)          (None, 23)                368       
                                                                 
 dense_1051 (Dense)          (None, 37)                888       
                                                                 
 dense_1052 (Dense)          (None, 31)                1178      
                                                                 
 dense_1053 (Dense)          (None, 15)                480       
                                                                 
 dense_1054 (Dense)          (None, 1)                 16        
                                                                 
Total params: 3,350
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.32e+03 | test_loss: nan | reg: 1.61e+02 | : 100%|███| 50/50 [00:59<00:00,  1.19s/it]

saving model version 0.1
Model: "sequential_253"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1055 (Dense)          (None, 47)                1316      
                                                                 
 dense_1056 (Dense)          (None, 34)                1632      
                                                                 
 dense_1057 (Dense)          (None, 13)                455       
                                                                 
 dense_1058 (Dense)          (None, 38)                532       
                                                                 
 dense_1059 (Dense)          (None, 1)                 39        
                                                                 
Total params: 3,974
Trainable params: 3,974
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.48e+03 | test_loss: nan | reg: 6.78e+01 | : 100%|███| 50/50 [01:06<00:00,  1.32s/it]

saving model version 0.1
Model: "sequential_254"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1060 (Dense)          (None, 6)                 168       
                                                                 
 dense_1061 (Dense)          (None, 31)                217       
                                                                 
 dense_1062 (Dense)          (None, 24)                768       
                                                                 
 dense_1063 (Dense)          (None, 12)                300       
                                                                 
 dense_1064 (Dense)          (None, 1)                 13        
                                                                 
Total params: 1,466
Trainable params: 1,466
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.28e+03 | test_loss: nan | reg: 4.51e+01 | : 100%|███| 50/50 [00:45<00:00,  1.09it/s]

saving model version 0.1
Model: "sequential_255"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1065 (Dense)          (None, 42)                1176      
                                                                 
 dense_1066 (Dense)          (None, 27)                1161      
                                                                 
 dense_1067 (Dense)          (None, 42)                1176      
                                                                 
 dense_1068 (Dense)          (None, 22)                946       
                                                                 
 dense_1069 (Dense)          (None, 1)                 23        
                                                                 
Total params: 4,482
Trainable params: 4,482
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.90e+03 | test_loss: nan | reg: 7.87e+01 | : 100%|███| 50/50 [01:04<00:00,  1.30s/it]

saving model version 0.1
Model: "sequential_256"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1070 (Dense)          (None, 29)                812       
                                                                 
 dense_1071 (Dense)          (None, 35)                1050      
                                                                 
 dense_1072 (Dense)          (None, 35)                1260      
                                                                 
 dense_1073 (Dense)          (None, 1)                 36        
                                                                 
Total params: 3,158
Trainable params: 3,158
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 4.06e+01 | : 100%|███| 50/50 [00:48<00:00,  1.03it/s]

saving model version 0.1
Model: "sequential_257"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1074 (Dense)          (None, 26)                728       
                                                                 
 dense_1075 (Dense)          (None, 23)                621       
                                                                 
 dense_1076 (Dense)          (None, 4)                 96        
                                                                 
 dense_1077 (Dense)          (None, 1)                 5         
                                                                 
Total params: 1,450
Trainable params: 1,450
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.53e+03 | test_loss: nan | reg: 1.80e+04 | : 100%|███| 50/50 [00:37<00:00,  1.32it/s]

saving model version 0.1
Model: "sequential_258"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1078 (Dense)          (None, 22)                616       
                                                                 
 dense_1079 (Dense)          (None, 7)                 161       
                                                                 
 dense_1080 (Dense)          (None, 36)                288       
                                                                 
 dense_1081 (Dense)          (None, 22)                814       
                                                                 
 dense_1082 (Dense)          (None, 1)                 23        
                                                                 
Total params: 1,902
Trainable params: 1,902
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 2, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.20e+03 | test_loss: nan | reg: 6.41e+01 | : 100%|███| 50/50 [01:07<00:00,  1.34s/it]


saving model version 0.1
Model: "sequential_259"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1083 (Dense)          (None, 44)                1232      
                                                                 
 dense_1084 (Dense)          (None, 23)                1035      
                                                                 
 dense_1085 (Dense)          (None, 1)                 24        
                                                                 
Total params: 2,291
Trainable params: 2,291
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.85e+03 | test_loss: nan | reg: 5.67e+01 | : 100%|███| 50/50 [00:30<00:00,  1.62it/s]

saving model version 0.1
Model: "sequential_260"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1086 (Dense)          (None, 20)                560       
                                                                 
 dense_1087 (Dense)          (None, 29)                609       
                                                                 
 dense_1088 (Dense)          (None, 29)                870       
                                                                 
 dense_1089 (Dense)          (None, 1)                 30        
                                                                 
Total params: 2,069
Trainable params: 2,069
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 2.95e+01 | : 100%|███| 50/50 [00:34<00:00,  1.46it/s]

saving model version 0.1
Model: "sequential_261"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1090 (Dense)          (None, 16)                448       
                                                                 
 dense_1091 (Dense)          (None, 27)                459       
                                                                 
 dense_1092 (Dense)          (None, 1)                 28        
                                                                 
Total params: 935
Trainable params: 935
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 2.42e+01 | : 100%|███| 50/50 [00:24<00:00,  2.01it/s]

saving model version 0.1
Model: "sequential_262"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1093 (Dense)          (None, 29)                812       
                                                                 
 dense_1094 (Dense)          (None, 17)                510       
                                                                 
 dense_1095 (Dense)          (None, 27)                486       
                                                                 
 dense_1096 (Dense)          (None, 1)                 28        
                                                                 
Total params: 1,836
Trainable params: 1,836
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.67e+03 | test_loss: nan | reg: 7.43e+01 | : 100%|███| 50/50 [00:51<00:00,  1.04s/it]

saving model version 0.1
Model: "sequential_263"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1097 (Dense)          (None, 31)                868       
                                                                 
 dense_1098 (Dense)          (None, 29)                928       
                                                                 
 dense_1099 (Dense)          (None, 9)                 270       
                                                                 
 dense_1100 (Dense)          (None, 1)                 10        
                                                                 
Total params: 2,076
Trainable params: 2,076
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.66e+03 | test_loss: nan | reg: 5.46e+01 | : 100%|███| 50/50 [00:43<00:00,  1.14it/s]

saving model version 0.1
Model: "sequential_264"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1101 (Dense)          (None, 30)                840       
                                                                 
 dense_1102 (Dense)          (None, 32)                992       
                                                                 
 dense_1103 (Dense)          (None, 11)                363       
                                                                 
 dense_1104 (Dense)          (None, 1)                 12        
                                                                 
Total params: 2,207
Trainable params: 2,207
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.65e+03 | test_loss: nan | reg: 6.33e+01 | : 100%|███| 50/50 [00:57<00:00,  1.16s/it]

saving model version 0.1
Model: "sequential_265"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1105 (Dense)          (None, 3)                 84        
                                                                 
 dense_1106 (Dense)          (None, 19)                76        
                                                                 
 dense_1107 (Dense)          (None, 1)                 20        
                                                                 
Total params: 180
Trainable params: 180
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 3.40e+01 | : 100%|███| 50/50 [00:33<00:00,  1.51it/s]

saving model version 0.1
Model: "sequential_266"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1108 (Dense)          (None, 26)                728       
                                                                 
 dense_1109 (Dense)          (None, 1)                 27        
                                                                 
Total params: 755
Trainable params: 755
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:08<00:00,  5.96it/s]


saving model version 0.1
Model: "sequential_267"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1110 (Dense)          (None, 24)                672       
                                                                 
 dense_1111 (Dense)          (None, 26)                650       
                                                                 
 dense_1112 (Dense)          (None, 22)                594       
                                                                 
 dense_1113 (Dense)          (None, 1)                 23        
                                                                 
Total params: 1,939
Trainable params: 1,939
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.24e+03 | test_loss: nan | reg: 5.24e+01 | : 100%|███| 50/50 [00:37<00:00,  1.32it/s]

saving model version 0.1
Model: "sequential_268"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1114 (Dense)          (None, 34)                952       
                                                                 
 dense_1115 (Dense)          (None, 36)                1260      
                                                                 
 dense_1116 (Dense)          (None, 15)                555       
                                                                 
 dense_1117 (Dense)          (None, 1)                 16        
                                                                 
Total params: 2,783
Trainable params: 2,783
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.51e+03 | test_loss: nan | reg: 6.54e+01 | : 100%|███| 50/50 [00:53<00:00,  1.06s/it]

saving model version 0.1
Model: "sequential_269"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1118 (Dense)          (None, 19)                532       
                                                                 
 dense_1119 (Dense)          (None, 40)                800       
                                                                 
 dense_1120 (Dense)          (None, 19)                779       
                                                                 
 dense_1121 (Dense)          (None, 1)                 20        
                                                                 
Total params: 2,131
Trainable params: 2,131
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.60e+03 | test_loss: nan | reg: 6.47e+01 | : 100%|███| 50/50 [00:51<00:00,  1.02s/it]

saving model version 0.1
Model: "sequential_270"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1122 (Dense)          (None, 35)                980       
                                                                 
 dense_1123 (Dense)          (None, 43)                1548      
                                                                 
 dense_1124 (Dense)          (None, 34)                1496      
                                                                 
 dense_1125 (Dense)          (None, 18)                630       
                                                                 
 dense_1126 (Dense)          (None, 1)                 19        
                                                                 
Total params: 4,673
Trainable params: 4,673
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.33e+03 | test_loss: nan | reg: 7.59e+01 | : 100%|███| 50/50 [00:59<00:00,  1.19s/it]

saving model version 0.1
Model: "sequential_271"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1127 (Dense)          (None, 24)                672       
                                                                 
 dense_1128 (Dense)          (None, 14)                350       
                                                                 
 dense_1129 (Dense)          (None, 15)                225       
                                                                 
 dense_1130 (Dense)          (None, 1)                 16        
                                                                 
Total params: 1,263
Trainable params: 1,263
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 4.14e+01 | : 100%|███| 50/50 [00:38<00:00,  1.31it/s]

saving model version 0.1
Model: "sequential_272"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1131 (Dense)          (None, 31)                868       
                                                                 
 dense_1132 (Dense)          (None, 34)                1088      
                                                                 
 dense_1133 (Dense)          (None, 22)                770       
                                                                 
 dense_1134 (Dense)          (None, 1)                 23        
                                                                 
Total params: 2,749
Trainable params: 2,749
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.88e+03 | test_loss: nan | reg: 1.38e+03 | : 100%|███| 50/50 [00:29<00:00,  1.68it/s]

saving model version 0.1
Model: "sequential_273"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1135 (Dense)          (None, 21)                588       
                                                                 
 dense_1136 (Dense)          (None, 33)                726       
                                                                 
 dense_1137 (Dense)          (None, 22)                748       
                                                                 
 dense_1138 (Dense)          (None, 1)                 23        
                                                                 
Total params: 2,085
Trainable params: 2,085
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 1.11e+02 | : 100%|███| 50/50 [00:40<00:00,  1.25it/s]

saving model version 0.1
Model: "sequential_274"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1139 (Dense)          (None, 13)                364       
                                                                 
 dense_1140 (Dense)          (None, 19)                266       
                                                                 
 dense_1141 (Dense)          (None, 25)                500       
                                                                 
 dense_1142 (Dense)          (None, 1)                 26        
                                                                 
Total params: 1,156
Trainable params: 1,156
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.04e+03 | test_loss: nan | reg: 5.05e+01 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_275"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1143 (Dense)          (None, 32)                896       
                                                                 
 dense_1144 (Dense)          (None, 20)                660       
                                                                 
 dense_1145 (Dense)          (None, 1)                 21        
                                                                 
Total params: 1,577
Trainable params: 1,577
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 2.87e+01 | : 100%|███| 50/50 [00:26<00:00,  1.89it/s]

saving model version 0.1
Model: "sequential_276"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1146 (Dense)          (None, 23)                644       
                                                                 
 dense_1147 (Dense)          (None, 10)                240       
                                                                 
 dense_1148 (Dense)          (None, 30)                330       
                                                                 
 dense_1149 (Dense)          (None, 1)                 31        
                                                                 
Total params: 1,245
Trainable params: 1,245
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.42e+03 | test_loss: nan | reg: 7.96e+01 | : 100%|███| 50/50 [00:54<00:00,  1.09s/it]

saving model version 0.1
Model: "sequential_277"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1150 (Dense)          (None, 21)                588       
                                                                 
 dense_1151 (Dense)          (None, 31)                682       
                                                                 
 dense_1152 (Dense)          (None, 1)                 32        
                                                                 
Total params: 1,302
Trainable params: 1,302
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 3.78e+01 | : 100%|███| 50/50 [00:17<00:00,  2.83it/s]


saving model version 0.1
Model: "sequential_278"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1153 (Dense)          (None, 17)                476       
                                                                 
 dense_1154 (Dense)          (None, 30)                540       
                                                                 
 dense_1155 (Dense)          (None, 1)                 31        
                                                                 
Total params: 1,047
Trainable params: 1,047
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 3.38e+01 | : 100%|███| 50/50 [00:40<00:00,  1.24it/s]

saving model version 0.1
Model: "sequential_279"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1156 (Dense)          (None, 10)                280       
                                                                 
 dense_1157 (Dense)          (None, 32)                352       
                                                                 
 dense_1158 (Dense)          (None, 1)                 33        
                                                                 
Total params: 665
Trainable params: 665
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.19e+03 | test_loss: nan | reg: 5.68e+01 | : 100%|███| 50/50 [00:33<00:00,  1.48it/s]

saving model version 0.1
Model: "sequential_280"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1159 (Dense)          (None, 26)                728       
                                                                 
 dense_1160 (Dense)          (None, 19)                513       
                                                                 
 dense_1161 (Dense)          (None, 33)                660       
                                                                 
 dense_1162 (Dense)          (None, 27)                918       
                                                                 
 dense_1163 (Dense)          (None, 1)                 28        
                                                                 
Total params: 2,847
Trainable params: 2,847
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.49e+03 | test_loss: nan | reg: 1.87e+02 | : 100%|███| 50/50 [00:37<00:00,  1.34it/s]

saving model version 0.1
Model: "sequential_281"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1164 (Dense)          (None, 28)                784       
                                                                 
 dense_1165 (Dense)          (None, 35)                1015      
                                                                 
 dense_1166 (Dense)          (None, 32)                1152      
                                                                 
 dense_1167 (Dense)          (None, 35)                1155      
                                                                 
 dense_1168 (Dense)          (None, 28)                1008      
                                                                 
 dense_1169 (Dense)          (None, 1)                 29        
                                                                 
Total params: 5,143
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 7.04e+03 | test_loss: nan | reg: 2.07e+04 | : 100%|███| 50/50 [01:04<00:00,  1.30s/it]

saving model version 0.1
Model: "sequential_282"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1170 (Dense)          (None, 31)                868       
                                                                 
 dense_1171 (Dense)          (None, 31)                992       
                                                                 
 dense_1172 (Dense)          (None, 27)                864       
                                                                 
 dense_1173 (Dense)          (None, 20)                560       
                                                                 
 dense_1174 (Dense)          (None, 1)                 21        
                                                                 
Total params: 3,305
Trainable params: 3,305
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 5.17e+01 | : 100%|███| 50/50 [00:50<00:00,  1.01s/it]

saving model version 0.1
Model: "sequential_283"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1175 (Dense)          (None, 17)                476       
                                                                 
 dense_1176 (Dense)          (None, 1)                 18        
                                                                 
Total params: 494
Trainable params: 494
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 6.09e+02 | : 100%|███| 50/50 [00:12<00:00,  4.03it/s]

saving model version 0.1
Model: "sequential_284"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1177 (Dense)          (None, 7)                 196       
                                                                 
 dense_1178 (Dense)          (None, 12)                96        
                                                                 
 dense_1179 (Dense)          (None, 27)                351       
                                                                 
 dense_1180 (Dense)          (None, 1)                 28        





                                                                 
Total params: 671
Trainable params: 671
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.06e+02 | : 100%|███| 50/50 [00:28<00:00,  1.72it/s]

saving model version 0.1
Model: "sequential_285"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1181 (Dense)          (None, 33)                924       
                                                                 
 dense_1182 (Dense)          (None, 35)                1190      
                                                                 
 dense_1183 (Dense)          (None, 23)                828       
                                                                 
 dense_1184 (Dense)          (None, 1)                 24        
                                                                 
Total params: 2,966
Trainable params: 2,966
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.10e+03 | test_loss: nan | reg: 4.98e+01 | : 100%|███| 50/50 [00:39<00:00,  1.26it/s]

saving model version 0.1
Model: "sequential_286"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1185 (Dense)          (None, 15)                420       
                                                                 
 dense_1186 (Dense)          (None, 46)                736       
                                                                 
 dense_1187 (Dense)          (None, 34)                1598      
                                                                 
 dense_1188 (Dense)          (None, 1)                 35        
                                                                 
Total params: 2,789
Trainable params: 2,789
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 4.86e+01 | : 100%|███| 50/50 [00:52<00:00,  1.04s/it]

saving model version 0.1
Model: "sequential_287"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1189 (Dense)          (None, 2)                 56        
                                                                 
 dense_1190 (Dense)          (None, 38)                114       
                                                                 
 dense_1191 (Dense)          (None, 11)                429       
                                                                 
 dense_1192 (Dense)          (None, 28)                336       
                                                                 
 dense_1193 (Dense)          (None, 1)                 29        
                                                                 
Total params: 964
Trainable params: 964
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.59e+03 | test_loss: nan | reg: 7.58e+01 | : 100%|███| 50/50 [01:04<00:00,  1.30s/it]

saving model version 0.1
Model: "sequential_288"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1194 (Dense)          (None, 21)                588       
                                                                 
 dense_1195 (Dense)          (None, 33)                726       
                                                                 
 dense_1196 (Dense)          (None, 40)                1360      
                                                                 
 dense_1197 (Dense)          (None, 1)                 41        
                                                                 
Total params: 2,715
Trainable params: 2,715
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:48<00:00,  1.02it/s]

saving model version 0.1
ERROR ON SAMPLE 229
Model: "sequential_289"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1198 (Dense)          (None, 28)                784       
                                                                 
 dense_1199 (Dense)          (None, 14)                406       
                                                                 
 dense_1200 (Dense)          (None, 26)                390       
                                                                 
 dense_1201 (Dense)          (None, 25)                675       
                                                                 
 dense_1202 (Dense)          (None, 1)                 26        
                                                                 
Total params: 2,281
Trainable params: 2,281
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 4.60e+01 | : 100%|███| 50/50 [01:09<00:00,  1.40s/it]

saving model version 0.1
Model: "sequential_290"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1203 (Dense)          (None, 39)                1092      
                                                                 
 dense_1204 (Dense)          (None, 18)                720       
                                                                 
 dense_1205 (Dense)          (None, 17)                323       
                                                                 
 dense_1206 (Dense)          (None, 1)                 18        
                                                                 
Total params: 2,153
Trainable params: 2,153
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.60e+03 | test_loss: nan | reg: 5.25e+01 | : 100%|███| 50/50 [00:53<00:00,  1.07s/it]

saving model version 0.1
Model: "sequential_291"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1207 (Dense)          (None, 12)                336       
                                                                 
 dense_1208 (Dense)          (None, 16)                208       
                                                                 
 dense_1209 (Dense)          (None, 1)                 17        
                                                                 
Total params: 561
Trainable params: 561
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.20e+03 | test_loss: nan | reg: 4.16e+01 | : 100%|███| 50/50 [00:29<00:00,  1.72it/s]

saving model version 0.1
Model: "sequential_292"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1210 (Dense)          (None, 27)                756       
                                                                 
 dense_1211 (Dense)          (None, 21)                588       
                                                                 
 dense_1212 (Dense)          (None, 15)                330       
                                                                 
 dense_1213 (Dense)          (None, 10)                160       
                                                                 
 dense_1214 (Dense)          (None, 1)                 11        
                                                                 
Total params: 1,845
Trainable params: 1,845
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.21e+03 | test_loss: nan | reg: 4.91e+01 | : 100%|███| 50/50 [00:56<00:00,  1.13s/it]

saving model version 0.1
Model: "sequential_293"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1215 (Dense)          (None, 15)                420       
                                                                 
 dense_1216 (Dense)          (None, 34)                544       
                                                                 
 dense_1217 (Dense)          (None, 7)                 245       
                                                                 
 dense_1218 (Dense)          (None, 34)                272       
                                                                 
 dense_1219 (Dense)          (None, 1)                 35        
                                                                 
Total params: 1,516
Trainable params: 1,516
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.11e+03 | test_loss: nan | reg: 6.30e+01 | : 100%|███| 50/50 [01:02<00:00,  1.25s/it]

saving model version 0.1
Model: "sequential_294"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1220 (Dense)          (None, 33)                924       
                                                                 
 dense_1221 (Dense)          (None, 11)                374       
                                                                 
 dense_1222 (Dense)          (None, 21)                252       
                                                                 
 dense_1223 (Dense)          (None, 1)                 22        
                                                                 
Total params: 1,572
Trainable params: 1,572
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 9.73e+01 | : 100%|███| 50/50 [00:38<00:00,  1.29it/s]

saving model version 0.1
Model: "sequential_295"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1224 (Dense)          (None, 21)                588       
                                                                 
 dense_1225 (Dense)          (None, 33)                726       
                                                                 
 dense_1226 (Dense)          (None, 27)                918       
                                                                 
 dense_1227 (Dense)          (None, 20)                560       
                                                                 
 dense_1228 (Dense)          (None, 1)                 21        
                                                                 
Total params: 2,813
Trainable params: 2,813
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.24e+03 | test_loss: nan | reg: 7.17e+01 | : 100%|███| 50/50 [01:07<00:00,  1.35s/it]

saving model version 0.1
Model: "sequential_296"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1229 (Dense)          (None, 50)                1400      
                                                                 
 dense_1230 (Dense)          (None, 13)                663       
                                                                 
 dense_1231 (Dense)          (None, 17)                238       
                                                                 
 dense_1232 (Dense)          (None, 39)                702       
                                                                 
 dense_1233 (Dense)          (None, 1)                 40        
                                                                 
Total params: 3,043
Trainable params: 3,043
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.18e+03 | test_loss: nan | reg: 4.49e+01 | : 100%|███| 50/50 [00:51<00:00,  1.03s/it]

saving model version 0.1
Model: "sequential_297"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1234 (Dense)          (None, 23)                644       
                                                                 
 dense_1235 (Dense)          (None, 26)                624       
                                                                 
 dense_1236 (Dense)          (None, 31)                837       
                                                                 
 dense_1237 (Dense)          (None, 1)                 32        
                                                                 
Total params: 2,137
Trainable params: 2,137
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.80e+03 | test_loss: nan | reg: 8.12e+01 | : 100%|███| 50/50 [00:51<00:00,  1.02s/it]

saving model version 0.1
Model: "sequential_298"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1238 (Dense)          (None, 21)                588       
                                                                 
 dense_1239 (Dense)          (None, 18)                396       
                                                                 
 dense_1240 (Dense)          (None, 1)                 19        
                                                                 
Total params: 1,003
Trainable params: 1,003
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.18e+03 | test_loss: nan | reg: 4.23e+01 | : 100%|███| 50/50 [00:43<00:00,  1.16it/s]

saving model version 0.1
Model: "sequential_299"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1241 (Dense)          (None, 8)                 224       
                                                                 
 dense_1242 (Dense)          (None, 33)                297       
                                                                 
 dense_1243 (Dense)          (None, 1)                 34        
                                                                 
Total params: 555
Trainable params: 555
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.97e+03 | test_loss: nan | reg: 7.38e+01 | : 100%|███| 50/50 [00:34<00:00,  1.43it/s]

saving model version 0.1
Model: "sequential_300"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1244 (Dense)          (None, 44)                1232      
                                                                 
 dense_1245 (Dense)          (None, 30)                1350      
                                                                 
 dense_1246 (Dense)          (None, 17)                527       
                                                                 
 dense_1247 (Dense)          (None, 33)                594       
                                                                 
 dense_1248 (Dense)          (None, 1)                 34        
                                                                 
Total params: 3,737
Trainable params: 3,737
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.15e+03 | test_loss: nan | reg: 4.39e+01 | : 100%|███| 50/50 [01:10<00:00,  1.40s/it]

saving model version 0.1
Model: "sequential_301"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1249 (Dense)          (None, 26)                728       
                                                                 
 dense_1250 (Dense)          (None, 43)                1161      
                                                                 
 dense_1251 (Dense)          (None, 22)                968       
                                                                 
 dense_1252 (Dense)          (None, 1)                 23        
                                                                 
Total params: 2,880
Trainable params: 2,880
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.25e+03 | test_loss: nan | reg: 3.60e+01 | : 100%|███| 50/50 [00:38<00:00,  1.29it/s]


saving model version 0.1
Model: "sequential_302"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1253 (Dense)          (None, 18)                504       
                                                                 
 dense_1254 (Dense)          (None, 36)                684       
                                                                 
 dense_1255 (Dense)          (None, 4)                 148       
                                                                 
 dense_1256 (Dense)          (None, 36)                180       
                                                                 
 dense_1257 (Dense)          (None, 1)                 37        
                                                                 
Total params: 1,553
Trainable params: 1,553
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/1

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:59<00:00,  1.20s/it]

saving model version 0.1
ERROR ON SAMPLE 243
Model: "sequential_303"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1258 (Dense)          (None, 22)                616       
                                                                 
 dense_1259 (Dense)          (None, 11)                253       
                                                                 
 dense_1260 (Dense)          (None, 1)                 12        
                                                                 
Total params: 881
Trainable params: 881
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 2.82e+01 | : 100%|███| 50/50 [00:45<00:00,  1.11it/s]

saving model version 0.1
Model: "sequential_304"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1261 (Dense)          (None, 33)                924       
                                                                 
 dense_1262 (Dense)          (None, 24)                816       
                                                                 
 dense_1263 (Dense)          (None, 17)                425       
                                                                 
 dense_1264 (Dense)          (None, 1)                 18        
                                                                 
Total params: 2,183
Trainable params: 2,183
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.37e+03 | test_loss: nan | reg: 9.51e+01 | : 100%|███| 50/50 [00:39<00:00,  1.28it/s]

saving model version 0.1
Model: "sequential_305"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1265 (Dense)          (None, 25)                700       
                                                                 
 dense_1266 (Dense)          (None, 42)                1092      
                                                                 
 dense_1267 (Dense)          (None, 49)                2107      
                                                                 
 dense_1268 (Dense)          (None, 21)                1050      
                                                                 
 dense_1269 (Dense)          (None, 1)                 22        
                                                                 
Total params: 4,971
Trainable params: 4,971
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.10e+03 | test_loss: nan | reg: 7.47e+01 | : 100%|███| 50/50 [01:01<00:00,  1.23s/it]

saving model version 0.1
Model: "sequential_306"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1270 (Dense)          (None, 23)                644       
                                                                 
 dense_1271 (Dense)          (None, 40)                960       
                                                                 
 dense_1272 (Dense)          (None, 36)                1476      
                                                                 
 dense_1273 (Dense)          (None, 37)                1369      
                                                                 
 dense_1274 (Dense)          (None, 1)                 38        
                                                                 
Total params: 4,487
Trainable params: 4,487
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.63e+03 | test_loss: nan | reg: 7.61e+01 | : 100%|███| 50/50 [00:58<00:00,  1.18s/it]

saving model version 0.1
Model: "sequential_307"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1275 (Dense)          (None, 44)                1232      
                                                                 
 dense_1276 (Dense)          (None, 21)                945       
                                                                 
 dense_1277 (Dense)          (None, 11)                242       
                                                                 
 dense_1278 (Dense)          (None, 1)                 12        
                                                                 
Total params: 2,431
Trainable params: 2,431
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.18e+03 | test_loss: nan | reg: 4.17e+01 | : 100%|███| 50/50 [00:47<00:00,  1.05it/s]

saving model version 0.1
Model: "sequential_308"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1279 (Dense)          (None, 26)                728       
                                                                 
 dense_1280 (Dense)          (None, 31)                837       
                                                                 
 dense_1281 (Dense)          (None, 43)                1376      
                                                                 
 dense_1282 (Dense)          (None, 32)                1408      
                                                                 
 dense_1283 (Dense)          (None, 1)                 33        
                                                                 
Total params: 4,382
Trainable params: 4,382
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.57e+03 | test_loss: nan | reg: 6.55e+04 | : 100%|███| 50/50 [00:46<00:00,  1.07it/s]

saving model version 0.1
Model: "sequential_309"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1284 (Dense)          (None, 16)                448       
                                                                 
 dense_1285 (Dense)          (None, 10)                170       
                                                                 
 dense_1286 (Dense)          (None, 1)                 11        
                                                                 
Total params: 629
Trainable params: 629
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.60e+03 | test_loss: nan | reg: 5.99e+01 | : 100%|███| 50/50 [00:41<00:00,  1.21it/s]

saving model version 0.1
Model: "sequential_310"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1287 (Dense)          (None, 28)                784       
                                                                 
 dense_1288 (Dense)          (None, 23)                667       
                                                                 
 dense_1289 (Dense)          (None, 1)                 24        
                                                                 
Total params: 1,475
Trainable params: 1,475
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 2.71e+01 | : 100%|███| 50/50 [00:15<00:00,  3.23it/s]


saving model version 0.1
Model: "sequential_311"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1290 (Dense)          (None, 24)                672       
                                                                 
 dense_1291 (Dense)          (None, 9)                 225       
                                                                 
 dense_1292 (Dense)          (None, 37)                370       
                                                                 
 dense_1293 (Dense)          (None, 1)                 38        
                                                                 
Total params: 1,305
Trainable params: 1,305
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 3.35e+01 | : 100%|███| 50/50 [00:40<00:00,  1.24it/s]

saving model version 0.1
Model: "sequential_312"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1294 (Dense)          (None, 14)                392       
                                                                 
 dense_1295 (Dense)          (None, 58)                870       
                                                                 
 dense_1296 (Dense)          (None, 20)                1180      
                                                                 
 dense_1297 (Dense)          (None, 19)                399       
                                                                 
 dense_1298 (Dense)          (None, 1)                 20        
                                                                 
Total params: 2,861
Trainable params: 2,861
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:56<00:00,  1.13s/it]

saving model version 0.1
ERROR ON SAMPLE 253
Model: "sequential_313"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1299 (Dense)          (None, 27)                756       
                                                                 
 dense_1300 (Dense)          (None, 13)                364       
                                                                 
 dense_1301 (Dense)          (None, 17)                238       
                                                                 
 dense_1302 (Dense)          (None, 32)                576       
                                                                 
 dense_1303 (Dense)          (None, 20)                660       
                                                                 
 dense_1304 (Dense)          (None, 1)                 21        
                                                                 
Total p




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 3, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.73e+03 | test_loss: nan | reg: 5.14e+03 | : 100%|███| 50/50 [01:25<00:00,  1.72s/it]


saving model version 0.1
Model: "sequential_314"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1305 (Dense)          (None, 23)                644       
                                                                 
 dense_1306 (Dense)          (None, 1)                 24        
                                                                 
Total params: 668
Trainable params: 668
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 1.25e+02 | : 100%|███| 50/50 [00:14<00:00,  3.48it/s]

saving model version 0.1
Model: "sequential_315"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1307 (Dense)          (None, 19)                532       
                                                                 
 dense_1308 (Dense)          (None, 21)                420       
                                                                 
 dense_1309 (Dense)          (None, 24)                528       
                                                                 
 dense_1310 (Dense)          (None, 1)                 25        
                                                                 
Total params: 1,505
Trainable params: 1,505
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.80e+03 | test_loss: nan | reg: 6.49e+01 | : 100%|███| 50/50 [00:51<00:00,  1.02s/it]

saving model version 0.1
Model: "sequential_316"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1311 (Dense)          (None, 32)                896       
                                                                 
 dense_1312 (Dense)          (None, 29)                957       
                                                                 
 dense_1313 (Dense)          (None, 17)                510       
                                                                 
 dense_1314 (Dense)          (None, 45)                810       
                                                                 
 dense_1315 (Dense)          (None, 1)                 46        
                                                                 
Total params: 3,219
Trainable params: 3,219
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:50<00:00,  1.01s/it]

saving model version 0.1
ERROR ON SAMPLE 257
Model: "sequential_317"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1316 (Dense)          (None, 19)                532       
                                                                 
 dense_1317 (Dense)          (None, 18)                360       
                                                                 
 dense_1318 (Dense)          (None, 34)                646       
                                                                 
 dense_1319 (Dense)          (None, 1)                 35        
                                                                 
Total params: 1,573
Trainable params: 1,573
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.23e+03 | test_loss: nan | reg: 5.79e+01 | : 100%|███| 50/50 [00:50<00:00,  1.01s/it]

saving model version 0.1
Model: "sequential_318"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1320 (Dense)          (None, 28)                784       
                                                                 
 dense_1321 (Dense)          (None, 21)                609       
                                                                 
 dense_1322 (Dense)          (None, 1)                 22        
                                                                 
Total params: 1,415
Trainable params: 1,415
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.24e+03 | test_loss: nan | reg: 4.90e+01 | : 100%|███| 50/50 [00:26<00:00,  1.89it/s]

saving model version 0.1
Model: "sequential_319"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1323 (Dense)          (None, 23)                644       
                                                                 
 dense_1324 (Dense)          (None, 18)                432       
                                                                 
 dense_1325 (Dense)          (None, 29)                551       
                                                                 
 dense_1326 (Dense)          (None, 1)                 30        
                                                                 
Total params: 1,657
Trainable params: 1,657
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 5.58e+03 | test_loss: nan | reg: 6.42e+03 | : 100%|███| 50/50 [00:20<00:00,  2.49it/s]

saving model version 0.1
Model: "sequential_320"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1327 (Dense)          (None, 39)                1092      
                                                                 
 dense_1328 (Dense)          (None, 37)                1480      
                                                                 
 dense_1329 (Dense)          (None, 21)                798       
                                                                 
 dense_1330 (Dense)          (None, 1)                 22        
                                                                 
Total params: 3,392
Trainable params: 3,392
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.44e+03 | test_loss: nan | reg: 7.81e+01 | : 100%|███| 50/50 [00:45<00:00,  1.10it/s]

saving model version 0.1
Model: "sequential_321"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1331 (Dense)          (None, 18)                504       
                                                                 
 dense_1332 (Dense)          (None, 28)                532       
                                                                 
 dense_1333 (Dense)          (None, 29)                841       
                                                                 
 dense_1334 (Dense)          (None, 6)                 180       
                                                                 
 dense_1335 (Dense)          (None, 14)                98        
                                                                 
 dense_1336 (Dense)          (None, 1)                 15        
                                                                 
Total params: 2,170
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 2, 2, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.33e+03 | test_loss: nan | reg: 3.81e+02 | : 100%|███| 50/50 [00:44<00:00,  1.13it/s]

saving model version 0.1
Model: "sequential_322"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1337 (Dense)          (None, 29)                812       
                                                                 
 dense_1338 (Dense)          (None, 52)                1560      
                                                                 
 dense_1339 (Dense)          (None, 26)                1378      
                                                                 
 dense_1340 (Dense)          (None, 28)                756       
                                                                 
 dense_1341 (Dense)          (None, 36)                1044      
                                                                 
 dense_1342 (Dense)          (None, 1)                 37        
                                                                 
Total params: 5,587
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.34e+03 | test_loss: nan | reg: 3.40e+02 | : 100%|███| 50/50 [01:13<00:00,  1.48s/it]

saving model version 0.1
Model: "sequential_323"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1343 (Dense)          (None, 35)                980       
                                                                 
 dense_1344 (Dense)          (None, 26)                936       
                                                                 
 dense_1345 (Dense)          (None, 1)                 27        
                                                                 
Total params: 1,943
Trainable params: 1,943
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 5.10e+01 | : 100%|███| 50/50 [00:18<00:00,  2.75it/s]

saving model version 0.1
Model: "sequential_324"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1346 (Dense)          (None, 27)                756       
                                                                 
 dense_1347 (Dense)          (None, 39)                1092      
                                                                 
 dense_1348 (Dense)          (None, 16)                640       
                                                                 
 dense_1349 (Dense)          (None, 25)                425       
                                                                 
 dense_1350 (Dense)          (None, 26)                676       
                                                                 
 dense_1351 (Dense)          (None, 1)                 27        
                                                                 
Total params: 3,616
Trainab




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.44e+03 | test_loss: nan | reg: 1.42e+02 | : 100%|███| 50/50 [00:45<00:00,  1.09it/s]

saving model version 0.1
Model: "sequential_325"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1352 (Dense)          (None, 10)                280       
                                                                 
 dense_1353 (Dense)          (None, 28)                308       
                                                                 
 dense_1354 (Dense)          (None, 25)                725       
                                                                 
 dense_1355 (Dense)          (None, 1)                 26        
                                                                 
Total params: 1,339
Trainable params: 1,339
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.47e+03 | test_loss: nan | reg: 7.09e+01 | : 100%|███| 50/50 [00:53<00:00,  1.07s/it]

saving model version 0.1
Model: "sequential_326"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1356 (Dense)          (None, 13)                364       
                                                                 
 dense_1357 (Dense)          (None, 27)                378       
                                                                 
 dense_1358 (Dense)          (None, 22)                616       
                                                                 
 dense_1359 (Dense)          (None, 1)                 23        
                                                                 
Total params: 1,381
Trainable params: 1,381
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.14e+03 | test_loss: nan | reg: 6.44e+01 | : 100%|███| 50/50 [00:45<00:00,  1.09it/s]

saving model version 0.1
Model: "sequential_327"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1360 (Dense)          (None, 17)                476       
                                                                 
 dense_1361 (Dense)          (None, 37)                666       
                                                                 
 dense_1362 (Dense)          (None, 35)                1330      
                                                                 
 dense_1363 (Dense)          (None, 1)                 36        
                                                                 
Total params: 2,508
Trainable params: 2,508
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.17e+03 | test_loss: nan | reg: 4.15e+01 | : 100%|███| 50/50 [00:41<00:00,  1.21it/s]

saving model version 0.1
Model: "sequential_328"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1364 (Dense)          (None, 21)                588       
                                                                 
 dense_1365 (Dense)          (None, 24)                528       
                                                                 
 dense_1366 (Dense)          (None, 1)                 25        
                                                                 
Total params: 1,141
Trainable params: 1,141
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.22e+03 | test_loss: nan | reg: 2.63e+01 | : 100%|███| 50/50 [00:23<00:00,  2.17it/s]

saving model version 0.1
Model: "sequential_329"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1367 (Dense)          (None, 31)                868       
                                                                 
 dense_1368 (Dense)          (None, 24)                768       
                                                                 
 dense_1369 (Dense)          (None, 15)                375       
                                                                 
 dense_1370 (Dense)          (None, 18)                288       
                                                                 
 dense_1371 (Dense)          (None, 1)                 19        
                                                                 





Total params: 2,318
Trainable params: 2,318
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.32e+03 | test_loss: nan | reg: 5.60e+01 | : 100%|███| 50/50 [00:32<00:00,  1.53it/s]

saving model version 0.1
Model: "sequential_330"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1372 (Dense)          (None, 37)                1036      
                                                                 
 dense_1373 (Dense)          (None, 18)                684       
                                                                 
 dense_1374 (Dense)          (None, 1)                 19        
                                                                 
Total params: 1,739
Trainable params: 1,739
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.09e+03 | test_loss: nan | reg: 4.67e+01 | : 100%|███| 50/50 [00:36<00:00,  1.38it/s]

saving model version 0.1
Model: "sequential_331"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1375 (Dense)          (None, 22)                616       
                                                                 
 dense_1376 (Dense)          (None, 29)                667       
                                                                 
 dense_1377 (Dense)          (None, 24)                720       
                                                                 
 dense_1378 (Dense)          (None, 16)                400       
                                                                 
 dense_1379 (Dense)          (None, 1)                 17        
                                                                 
Total params: 2,420
Trainable params: 2,420
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 3, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.12e+03 | test_loss: nan | reg: 4.71e+01 | : 100%|███| 50/50 [00:59<00:00,  1.20s/it]

saving model version 0.1
Model: "sequential_332"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1380 (Dense)          (None, 25)                700       
                                                                 
 dense_1381 (Dense)          (None, 35)                910       
                                                                 
 dense_1382 (Dense)          (None, 31)                1116      
                                                                 
 dense_1383 (Dense)          (None, 20)                640       
                                                                 
 dense_1384 (Dense)          (None, 1)                 21        
                                                                 
Total params: 3,387
Trainable params: 3,387
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.26e+03 | test_loss: nan | reg: 6.27e+01 | : 100%|███| 50/50 [00:57<00:00,  1.15s/it]

saving model version 0.1
Model: "sequential_333"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1385 (Dense)          (None, 9)                 252       
                                                                 
 dense_1386 (Dense)          (None, 25)                250       
                                                                 
 dense_1387 (Dense)          (None, 17)                442       
                                                                 
 dense_1388 (Dense)          (None, 18)                324       
                                                                 
 dense_1389 (Dense)          (None, 1)                 19        
                                                                 
Total params: 1,287
Trainable params: 1,287
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 2, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.90e+03 | test_loss: nan | reg: 4.83e+01 | : 100%|███| 50/50 [00:58<00:00,  1.16s/it]


saving model version 0.1
Model: "sequential_334"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1390 (Dense)          (None, 21)                588       
                                                                 
 dense_1391 (Dense)          (None, 22)                484       
                                                                 
 dense_1392 (Dense)          (None, 16)                368       
                                                                 
 dense_1393 (Dense)          (None, 34)                578       
                                                                 
 dense_1394 (Dense)          (None, 30)                1050      
                                                                 
 dense_1395 (Dense)          (None, 1)                 31        
                                                                 
Total params: 3,099
Trainab

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.95e+03 | test_loss: nan | reg: 7.87e+01 | : 100%|███| 50/50 [01:28<00:00,  1.77s/it]

saving model version 0.1
Model: "sequential_335"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1396 (Dense)          (None, 31)                868       
                                                                 
 dense_1397 (Dense)          (None, 15)                480       
                                                                 
 dense_1398 (Dense)          (None, 32)                512       
                                                                 
 dense_1399 (Dense)          (None, 1)                 33        
                                                                 
Total params: 1,893
Trainable params: 1,893
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.63e+03 | test_loss: nan | reg: 7.18e+01 | : 100%|███| 50/50 [00:58<00:00,  1.17s/it]

saving model version 0.1
Model: "sequential_336"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1400 (Dense)          (None, 23)                644       
                                                                 
 dense_1401 (Dense)          (None, 1)                 24        
                                                                 
Total params: 668
Trainable params: 668
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.02e+02 | : 100%|███| 50/50 [00:08<00:00,  6.02it/s]

saving model version 0.1
Model: "sequential_337"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1402 (Dense)          (None, 26)                728       
                                                                 
 dense_1403 (Dense)          (None, 32)                864       
                                                                 
 dense_1404 (Dense)          (None, 38)                1254      
                                                                 
 dense_1405 (Dense)          (None, 13)                507       
                                                                 
 dense_1406 (Dense)          (None, 32)                448       
                                                                 
 dense_1407 (Dense)          (None, 1)                 33        





                                                                 
Total params: 3,834
Trainable params: 3,834
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.03e+03 | test_loss: nan | reg: 6.62e+01 | : 100%|███| 50/50 [01:22<00:00,  1.64s/it]

saving model version 0.1
Model: "sequential_338"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1408 (Dense)          (None, 51)                1428      
                                                                 
 dense_1409 (Dense)          (None, 32)                1664      
                                                                 
 dense_1410 (Dense)          (None, 29)                957       
                                                                 
 dense_1411 (Dense)          (None, 1)                 30        
                                                                 
Total params: 4,079
Trainable params: 4,079
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.08e+03 | test_loss: nan | reg: 3.91e+01 | : 100%|███| 50/50 [00:44<00:00,  1.12it/s]

saving model version 0.1
Model: "sequential_339"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1412 (Dense)          (None, 20)                560       
                                                                 
 dense_1413 (Dense)          (None, 24)                504       
                                                                 
 dense_1414 (Dense)          (None, 9)                 225       
                                                                 
 dense_1415 (Dense)          (None, 1)                 10        
                                                                 
Total params: 1,299
Trainable params: 1,299
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.11e+03 | test_loss: nan | reg: 5.04e+01 | : 100%|███| 50/50 [00:49<00:00,  1.01it/s]

saving model version 0.1
Model: "sequential_340"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1416 (Dense)          (None, 24)                672       
                                                                 
 dense_1417 (Dense)          (None, 18)                450       
                                                                 
 dense_1418 (Dense)          (None, 1)                 19        
                                                                 
Total params: 1,141
Trainable params: 1,141
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.72e+03 | test_loss: nan | reg: 9.25e+01 | : 100%|███| 50/50 [00:36<00:00,  1.38it/s]

saving model version 0.1
Model: "sequential_341"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1419 (Dense)          (None, 9)                 252       
                                                                 
 dense_1420 (Dense)          (None, 18)                180       
                                                                 
 dense_1421 (Dense)          (None, 1)                 19        
                                                                 
Total params: 451
Trainable params: 451
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.64e+03 | test_loss: nan | reg: 2.58e+05 | : 100%|███| 50/50 [00:30<00:00,  1.62it/s]

saving model version 0.1
Model: "sequential_342"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1422 (Dense)          (None, 34)                952       
                                                                 
 dense_1423 (Dense)          (None, 1)                 35        
                                                                 
Total params: 987
Trainable params: 987
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 1.03e+02 | : 100%|███| 50/50 [00:10<00:00,  4.87it/s]


saving model version 0.1
Model: "sequential_343"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1424 (Dense)          (None, 15)                420       
                                                                 
 dense_1425 (Dense)          (None, 24)                384       
                                                                 
 dense_1426 (Dense)          (None, 18)                450       
                                                                 
 dense_1427 (Dense)          (None, 1)                 19        
                                                                 
Total params: 1,273
Trainable params: 1,273
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory create

  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.23e+03 | test_loss: nan | reg: 7.87e+01 | : 100%|███| 50/50 [00:34<00:00,  1.46it/s]

saving model version 0.1
Model: "sequential_344"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1428 (Dense)          (None, 45)                1260      
                                                                 
 dense_1429 (Dense)          (None, 28)                1288      
                                                                 
 dense_1430 (Dense)          (None, 36)                1044      
                                                                 
 dense_1431 (Dense)          (None, 25)                925       
                                                                 
 dense_1432 (Dense)          (None, 1)                 26        
                                                                 
Total params: 4,543
Trainable params: 4,543
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 2, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.71e+03 | test_loss: nan | reg: 2.60e+03 | : 100%|███| 50/50 [00:49<00:00,  1.02it/s]

saving model version 0.1
Model: "sequential_345"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1433 (Dense)          (None, 19)                532       
                                                                 
 dense_1434 (Dense)          (None, 18)                360       
                                                                 
 dense_1435 (Dense)          (None, 35)                665       
                                                                 
 dense_1436 (Dense)          (None, 1)                 36        
                                                                 
Total params: 1,593
Trainable params: 1,593
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.16e+03 | test_loss: nan | reg: 5.17e+01 | : 100%|███| 50/50 [00:44<00:00,  1.12it/s]

saving model version 0.1
Model: "sequential_346"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1437 (Dense)          (None, 17)                476       
                                                                 
 dense_1438 (Dense)          (None, 29)                522       
                                                                 
 dense_1439 (Dense)          (None, 30)                900       
                                                                 
 dense_1440 (Dense)          (None, 1)                 31        
                                                                 
Total params: 1,929
Trainable params: 1,929
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [00:53<00:00,  1.07s/it]

saving model version 0.1
ERROR ON SAMPLE 287
Model: "sequential_347"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1441 (Dense)          (None, 29)                812       
                                                                 
 dense_1442 (Dense)          (None, 34)                1020      
                                                                 
 dense_1443 (Dense)          (None, 12)                420       
                                                                 
 dense_1444 (Dense)          (None, 40)                520       
                                                                 
 dense_1445 (Dense)          (None, 16)                656       
                                                                 
 dense_1446 (Dense)          (None, 1)                 17        
                                                                 
Total p




None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 4, 3, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.31e+03 | test_loss: nan | reg: 2.49e+02 | : 100%|███| 50/50 [01:15<00:00,  1.50s/it]

saving model version 0.1
Model: "sequential_348"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1447 (Dense)          (None, 43)                1204      
                                                                 
 dense_1448 (Dense)          (None, 17)                748       
                                                                 
 dense_1449 (Dense)          (None, 35)                630       
                                                                 
 dense_1450 (Dense)          (None, 1)                 36        
                                                                 
Total params: 2,618
Trainable params: 2,618
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 2, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.99e+03 | test_loss: nan | reg: 5.54e+01 | : 100%|███| 50/50 [00:39<00:00,  1.27it/s]

saving model version 0.1
Model: "sequential_349"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1451 (Dense)          (None, 16)                448       
                                                                 
 dense_1452 (Dense)          (None, 23)                391       
                                                                 
 dense_1453 (Dense)          (None, 1)                 24        
                                                                 
Total params: 863
Trainable params: 863
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.28e+03 | test_loss: nan | reg: 4.51e+01 | : 100%|███| 50/50 [00:21<00:00,  2.31it/s]

saving model version 0.1
Model: "sequential_350"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1454 (Dense)          (None, 18)                504       
                                                                 
 dense_1455 (Dense)          (None, 43)                817       
                                                                 
 dense_1456 (Dense)          (None, 38)                1672      
                                                                 
 dense_1457 (Dense)          (None, 1)                 39        
                                                                 
Total params: 3,032
Trainable params: 3,032
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.17e+03 | test_loss: nan | reg: 3.99e+01 | : 100%|███| 50/50 [00:40<00:00,  1.25it/s]

saving model version 0.1
Model: "sequential_351"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1458 (Dense)          (None, 11)                308       
                                                                 
 dense_1459 (Dense)          (None, 50)                600       
                                                                 
 dense_1460 (Dense)          (None, 1)                 51        
                                                                 
Total params: 959
Trainable params: 959
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 4.13e+01 | : 100%|███| 50/50 [00:27<00:00,  1.84it/s]

saving model version 0.1
Model: "sequential_352"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1461 (Dense)          (None, 34)                952       
                                                                 
 dense_1462 (Dense)          (None, 39)                1365      
                                                                 
 dense_1463 (Dense)          (None, 29)                1160      
                                                                 
 dense_1464 (Dense)          (None, 18)                540       
                                                                 
 dense_1465 (Dense)          (None, 1)                 19        
                                                                 
Total params: 4,036
Trainable params: 4,036
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 5, 3, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.29e+03 | test_loss: nan | reg: 5.31e+01 | : 100%|███| 50/50 [00:46<00:00,  1.08it/s]

saving model version 0.1
Model: "sequential_353"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1466 (Dense)          (None, 29)                812       
                                                                 
 dense_1467 (Dense)          (None, 27)                810       
                                                                 
 dense_1468 (Dense)          (None, 1)                 28        
                                                                 
Total params: 1,650
Trainable params: 1,650
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.19e+03 | test_loss: nan | reg: 2.34e+01 | : 100%|███| 50/50 [00:36<00:00,  1.37it/s]

saving model version 0.1
Model: "sequential_354"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1469 (Dense)          (None, 36)                1008      
                                                                 
 dense_1470 (Dense)          (None, 1)                 37        
                                                                 
Total params: 1,045
Trainable params: 1,045
Non-trainable params: 0
_________________________________________________________________
None
Epoch 1/10





Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.27e+03 | test_loss: nan | reg: 1.09e+02 | : 100%|███| 50/50 [00:14<00:00,  3.49it/s]

saving model version 0.1
Model: "sequential_355"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1471 (Dense)          (None, 15)                420       
                                                                 
 dense_1472 (Dense)          (None, 25)                400       
                                                                 
 dense_1473 (Dense)          (None, 39)                1014      
                                                                 
 dense_1474 (Dense)          (None, 44)                1760      
                                                                 
 dense_1475 (Dense)          (None, 1)                 45        
                                                                 
Total params: 3,639
Trainable params: 3,639
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 6, 4, 4, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.49e+03 | test_loss: nan | reg: 7.31e+01 | : 100%|███| 50/50 [01:21<00:00,  1.64s/it]

saving model version 0.1
Model: "sequential_356"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1476 (Dense)          (None, 25)                700       
                                                                 
 dense_1477 (Dense)          (None, 27)                702       
                                                                 
 dense_1478 (Dense)          (None, 28)                784       
                                                                 
 dense_1479 (Dense)          (None, 1)                 29        
                                                                 
Total params: 2,215
Trainable params: 2,215
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 3.86e+03 | test_loss: nan | reg: 9.35e+01 | : 100%|███| 50/50 [00:46<00:00,  1.07it/s]

saving model version 0.1
Model: "sequential_357"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1480 (Dense)          (None, 43)                1204      
                                                                 
 dense_1481 (Dense)          (None, 32)                1408      
                                                                 
 dense_1482 (Dense)          (None, 20)                660       
                                                                 
 dense_1483 (Dense)          (None, 21)                441       
                                                                 
 dense_1484 (Dense)          (None, 1)                 22        
                                                                 
Total params: 3,735
Trainable params: 3,735
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 4, 5, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: nan | test_loss: nan | reg: nan | : 100%|█████████████| 50/50 [01:02<00:00,  1.24s/it]

saving model version 0.1
ERROR ON SAMPLE 298
Model: "sequential_358"
_________________________________________________________________
 Layer (type)                Output Shape              Param #   
 dense_1485 (Dense)          (None, 8)                 224       
                                                                 
 dense_1486 (Dense)          (None, 25)                225       
                                                                 
 dense_1487 (Dense)          (None, 1)                 26        
                                                                 
Total params: 475
Trainable params: 475
Non-trainable params: 0
_________________________________________________________________





None
Epoch 1/10
Epoch 2/10
Epoch 3/10
Epoch 4/10
Epoch 5/10
Epoch 6/10
Epoch 7/10
Epoch 8/10
Epoch 9/10
Epoch 10/10
[27, 3, 1]
checkpoint directory created: ./model
saving model version 0.0


  self.subnode_actscale.append(torch.std(x, dim=0).detach())
  input_range = torch.std(preacts, dim=0) + 0.1
  output_range_spline = torch.std(postacts_numerical, dim=0) # for training, only penalize the spline part
  output_range = torch.std(postacts, dim=0) # for visualization, include the contribution from both spline + symbolic
| train_loss: 4.30e+03 | test_loss: nan | reg: 2.43e+01 | : 100%|███| 50/50 [00:27<00:00,  1.83it/s]

saving model version 0.1



