# Hyperparameter Optimization (HPO)

In [26]:
import iqpopt as iqp
from iqpopt.utils import initialize_from_data, local_gates
import iqpopt.gen_qml as genq
from iqpopt.gen_qml.utils import median_heuristic
import optuna
import pennylane as qml
import jax
from jax import numpy as jnp
from utils.nisq import aachen_connectivity, efficient_connectivity_gates
from datasets.bipartites import BipartiteGraphDataset
from datasets.er import ErdosRenyiGraphDataset
import numpy as np

In [27]:
# Experiment configuration. NODES, TYPE and CONN are interpolated into the
# dataset file name in the loading cell.
NODES = 8            # graph size
TYPE = "Bipartite"   # dataset family tag
CONN = "Medium"      # connectivity tag
NUM_LAYERS = 1       # NOTE(review): not referenced by any other visible cell
# Number of unordered node pairs, C(NODES, 2) -- presumably one qubit per
# possible undirected edge; confirm against the dataset vector length.
QUBITS = (NODES * (NODES - 1)) // 2

In [28]:
# Path of the pre-generated dataset pickle selected by the configuration constants.
ds_path = f'./datasets/raw_data/{NODES}N_{TYPE}_{CONN}.pkl'

# Load the stored graphs and keep their vector encoding as a JAX array.
# NOTE(review): nodes=1 / edge_prob=0.1 look like placeholder constructor
# arguments that from_file() supersedes -- confirm. The dataset class is also
# fixed to BipartiteGraphDataset even though TYPE is configurable.
train_ds = jnp.array(
    BipartiteGraphDataset(nodes=1, edge_prob=0.1)
    .from_file(ds_path)
    .vectors
    .copy()
)

[Dataset] Loaded 271 samples from ./datasets/raw_data/8N_Bipartite_Medium.pkl
  Created: 2025-05-30T13:15:17.387588
  Unique graphs: 271
  Version: 1.0


In [29]:
# Build the gate list on the connectivity map and wrap it in an IQP simulator.
grid_conn = aachen_connectivity()
# Use the NUM_LAYERS configuration constant instead of a second hard-coded 1,
# so that changing the configuration actually changes this circuit.
# NOTE(review): assumes the third argument of efficient_connectivity_gates is
# the layer count -- confirm against utils.nisq.
gates = efficient_connectivity_gates(grid_conn, QUBITS, NUM_LAYERS)
circ = iqp.IqpSimulator(QUBITS, gates, device='lightning.qubit')

# Root JAX PRNG key with a fixed seed.
# NOTE(review): neither circ nor base_key is passed to run_hpo in the visible cells.
base_key = jax.random.PRNGKey(42)

In [30]:
# Baseline kernel bandwidth computed from the training vectors via IQPopt's
# median_heuristic. It is handed to run_hpo below; the trial logs report a
# per-trial "Sigma Multiplier", presumably a factor applied to this value --
# confirm in utils.hpo.
base_sigma = median_heuristic(train_ds)

In [31]:
from utils.hpo import run_hpo

In [32]:
# Launch the hyperparameter search; the returned object is kept as `study`.
# NOTE(review): every trial in the captured log ends with
# "Training has not converged after 150 steps", so trials are ranked on
# unconverged losses -- consider a larger n_iters_hpo.
# NOTE(review): no seed is passed here, so the sampled trials are presumably
# not reproducible across runs -- confirm whether run_hpo accepts a seed/key.
study = run_hpo(
    grid_conn, QUBITS, base_sigma,   # connectivity map, qubit count, baseline bandwidth
    train_ds=train_ds,
    n_trials=100, n_iters_hpo=150,   # search budget: trials x training steps per trial
    n_ops=2000, n_samples=2000,
)

[I 2025-06-07 22:03:32,083] A new study created in memory with name: no-name-f787b184-2c50-4cb3-a9d3-4ad6e2b74f09


Trial 0:
  Learning Rate: 0.0025567885528974305
  Sigma Multiplier: 1.783348193573144
  Initialization Multiplier: 0.22222473061580392
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 22.20it/s, loss=-0.000167, elapsed time=0.03, total time=7.71]
[I 2025-06-07 22:03:40,197] Trial 0 finished with value: -0.00016690732082928002 and parameters: {'learning_rate': 0.0025567885528974305, 'sigma_multiplier': 1.783348193573144, 'num_layers': 5, 'initialization_multiplier': 0.22222473061580392}. Best is trial 0 with value: -0.00016690732082928002.


Training has not converged after 150 steps
Trial 0 final loss: -0.00016691
Trial 1:
  Learning Rate: 0.01105749832032795
  Sigma Multiplier: 1.4072101856106365
  Initialization Multiplier: 1.8130626767089446
  Number of Layers: 2


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 22.32it/s, loss=-0.000140, elapsed time=0.03, total time=6.99]
[I 2025-06-07 22:03:47,300] Trial 1 finished with value: -0.0001401237736701446 and parameters: {'learning_rate': 0.01105749832032795, 'sigma_multiplier': 1.4072101856106365, 'num_layers': 2, 'initialization_multiplier': 1.8130626767089446}. Best is trial 0 with value: -0.00016690732082928002.


Training has not converged after 150 steps
Trial 1 final loss: -0.00014012
Trial 2:
  Learning Rate: 0.028125188346190263
  Sigma Multiplier: 1.7983111155356568
  Initialization Multiplier: 1.9027821119275237
  Number of Layers: 1


Training Progress: 100%|██████████| 150/150 [00:03<00:00, 37.87it/s, loss=-0.000189, elapsed time=0.02, total time=4.19]
[I 2025-06-07 22:03:51,562] Trial 2 finished with value: -0.0001893437554216291 and parameters: {'learning_rate': 0.028125188346190263, 'sigma_multiplier': 1.7983111155356568, 'num_layers': 1, 'initialization_multiplier': 1.9027821119275237}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 2 final loss: -0.00018934
Trial 3:
  Learning Rate: 0.01445603922833321
  Sigma Multiplier: 0.25386366186939124
  Initialization Multiplier: 1.2993560213751045
  Number of Layers: 2


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 19.15it/s, loss=0.001565, elapsed time=0.05, total time=8.02]
[I 2025-06-07 22:03:59,599] Trial 3 finished with value: 0.0015654975949777885 and parameters: {'learning_rate': 0.01445603922833321, 'sigma_multiplier': 0.25386366186939124, 'num_layers': 2, 'initialization_multiplier': 1.2993560213751045}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 3 final loss: 0.00156550
Trial 4:
  Learning Rate: 7.137624680463252e-05
  Sigma Multiplier: 0.8946783600711018
  Initialization Multiplier: 1.4094285783414464
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 22.98it/s, loss=0.101139, elapsed time=0.04, total time=6.81]
[I 2025-06-07 22:04:06,529] Trial 4 finished with value: 0.10113895457628126 and parameters: {'learning_rate': 7.137624680463252e-05, 'sigma_multiplier': 0.8946783600711018, 'num_layers': 3, 'initialization_multiplier': 1.4094285783414464}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 4 final loss: 0.10113895
Trial 5:
  Learning Rate: 0.004062221437972854
  Sigma Multiplier: 0.4894635555843013
  Initialization Multiplier: 1.247292729766109
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 18.10it/s, loss=0.013728, elapsed time=0.05, total time=8.49]
[I 2025-06-07 22:04:15,044] Trial 5 finished with value: 0.013727762925471206 and parameters: {'learning_rate': 0.004062221437972854, 'sigma_multiplier': 0.4894635555843013, 'num_layers': 3, 'initialization_multiplier': 1.247292729766109}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 5 final loss: 0.01372776
Trial 6:
  Learning Rate: 0.0024645530189435555
  Sigma Multiplier: 1.1474889112339182
  Initialization Multiplier: 1.5900220039258495
  Number of Layers: 1


Training Progress: 100%|██████████| 150/150 [00:04<00:00, 31.10it/s, loss=0.007878, elapsed time=0.02, total time=5.02]
[I 2025-06-07 22:04:20,075] Trial 6 finished with value: 0.00787848147178078 and parameters: {'learning_rate': 0.0024645530189435555, 'sigma_multiplier': 1.1474889112339182, 'num_layers': 1, 'initialization_multiplier': 1.5900220039258495}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 6 final loss: 0.00787848
Trial 7:
  Learning Rate: 0.00010720365853124194
  Sigma Multiplier: 0.4077820618442223
  Initialization Multiplier: 1.7045901126196836
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.53it/s, loss=0.040150, elapsed time=0.07, total time=9.32]
[I 2025-06-07 22:04:29,541] Trial 7 finished with value: 0.040150257731159225 and parameters: {'learning_rate': 0.00010720365853124194, 'sigma_multiplier': 0.4077820618442223, 'num_layers': 4, 'initialization_multiplier': 1.7045901126196836}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 7 final loss: 0.04015026
Trial 8:
  Learning Rate: 0.0026542031205753435
  Sigma Multiplier: 0.7047761721362292
  Initialization Multiplier: 1.5941776723709296
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 21.02it/s, loss=0.004391, elapsed time=0.04, total time=7.34]
[I 2025-06-07 22:04:36,904] Trial 8 finished with value: 0.004390632346879258 and parameters: {'learning_rate': 0.0026542031205753435, 'sigma_multiplier': 0.7047761721362292, 'num_layers': 3, 'initialization_multiplier': 1.5941776723709296}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 8 final loss: 0.00439063
Trial 9:
  Learning Rate: 3.655338942353789e-05
  Sigma Multiplier: 1.8822787357169253
  Initialization Multiplier: 1.6392082260409053
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:05<00:00, 26.06it/s, loss=0.023162, elapsed time=0.03, total time=5.95]
[I 2025-06-07 22:04:42,871] Trial 9 finished with value: 0.023161810396659956 and parameters: {'learning_rate': 3.655338942353789e-05, 'sigma_multiplier': 1.8822787357169253, 'num_layers': 3, 'initialization_multiplier': 1.6392082260409053}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 9 final loss: 0.02316181
Trial 10:
  Learning Rate: 0.0681249192505627
  Sigma Multiplier: 1.4881954444865317
  Initialization Multiplier: 0.6924162937177465
  Number of Layers: 1


Training Progress: 100%|██████████| 150/150 [00:04<00:00, 36.10it/s, loss=-0.000065, elapsed time=0.02, total time=4.35]
[I 2025-06-07 22:04:47,255] Trial 10 finished with value: -6.54219587141118e-05 and parameters: {'learning_rate': 0.0681249192505627, 'sigma_multiplier': 1.4881954444865317, 'num_layers': 1, 'initialization_multiplier': 0.6924162937177465}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 10 final loss: -0.00006542
Trial 11:
  Learning Rate: 0.0003710752004593702
  Sigma Multiplier: 1.999592397165958
  Initialization Multiplier: 0.030752919117536442
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 19.37it/s, loss=0.015309, elapsed time=0.05, total time=7.94]
[I 2025-06-07 22:04:55,293] Trial 11 finished with value: 0.015309435066321713 and parameters: {'learning_rate': 0.0003710752004593702, 'sigma_multiplier': 1.999592397165958, 'num_layers': 5, 'initialization_multiplier': 0.030752919117536442}. Best is trial 2 with value: -0.0001893437554216291.


Training has not converged after 150 steps
Trial 11 final loss: 0.01530944
Trial 12:
  Learning Rate: 0.0549357762867691
  Sigma Multiplier: 1.651826183245932
  Initialization Multiplier: 0.6878366220675941
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.80it/s, loss=-0.000313, elapsed time=0.06, total time=8.62]
[I 2025-06-07 22:05:03,969] Trial 12 finished with value: -0.0003133227874394899 and parameters: {'learning_rate': 0.0549357762867691, 'sigma_multiplier': 1.651826183245932, 'num_layers': 5, 'initialization_multiplier': 0.6878366220675941}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 12 final loss: -0.00031332
Trial 13:
  Learning Rate: 0.05330461715630426
  Sigma Multiplier: 1.5504681795343647
  Initialization Multiplier: 0.7798502681297214
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.52it/s, loss=-0.000193, elapsed time=0.05, total time=9.33]
[I 2025-06-07 22:05:13,338] Trial 13 finished with value: -0.00019306572593139756 and parameters: {'learning_rate': 0.05330461715630426, 'sigma_multiplier': 1.5504681795343647, 'num_layers': 4, 'initialization_multiplier': 0.7798502681297214}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 13 final loss: -0.00019307
Trial 14:
  Learning Rate: 0.0864888977445141
  Sigma Multiplier: 1.456579063911973
  Initialization Multiplier: 0.7021897182372998
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.45it/s, loss=-0.000074, elapsed time=0.07, total time=10.7]
[I 2025-06-07 22:05:24,087] Trial 14 finished with value: -7.430280040869785e-05 and parameters: {'learning_rate': 0.0864888977445141, 'sigma_multiplier': 1.456579063911973, 'num_layers': 4, 'initialization_multiplier': 0.7021897182372998}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 14 final loss: -0.00007430
Trial 15:
  Learning Rate: 0.030383209851680172
  Sigma Multiplier: 1.1871145633741607
  Initialization Multiplier: 0.7982011796020455
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 23.17it/s, loss=0.000028, elapsed time=0.03, total time=6.72] 
[I 2025-06-07 22:05:30,846] Trial 15 finished with value: 2.798423645334503e-05 and parameters: {'learning_rate': 0.030383209851680172, 'sigma_multiplier': 1.1871145633741607, 'num_layers': 4, 'initialization_multiplier': 0.7982011796020455}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 15 final loss: 0.00002798
Trial 16:
  Learning Rate: 0.0005763075697943925
  Sigma Multiplier: 1.612238173944204
  Initialization Multiplier: 0.44189353896924677
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 22.02it/s, loss=0.018505, elapsed time=0.04, total time=7.01]
[I 2025-06-07 22:05:37,892] Trial 16 finished with value: 0.0185047300411923 and parameters: {'learning_rate': 0.0005763075697943925, 'sigma_multiplier': 1.612238173944204, 'num_layers': 5, 'initialization_multiplier': 0.44189353896924677}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 16 final loss: 0.01850473
Trial 17:
  Learning Rate: 0.007770007055989667
  Sigma Multiplier: 1.3025255792074875
  Initialization Multiplier: 1.0468322507991643
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 22.97it/s, loss=-0.000223, elapsed time=0.03, total time=6.74]
[I 2025-06-07 22:05:44,668] Trial 17 finished with value: -0.0002230208942895938 and parameters: {'learning_rate': 0.007770007055989667, 'sigma_multiplier': 1.3025255792074875, 'num_layers': 4, 'initialization_multiplier': 1.0468322507991643}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 17 final loss: -0.00022302
Trial 18:
  Learning Rate: 0.006753195798552224
  Sigma Multiplier: 1.2675020386024254
  Initialization Multiplier: 0.9846919297128365
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.73it/s, loss=-0.000042, elapsed time=0.06, total time=8.71]
[I 2025-06-07 22:05:53,421] Trial 18 finished with value: -4.1574364830257644e-05 and parameters: {'learning_rate': 0.006753195798552224, 'sigma_multiplier': 1.2675020386024254, 'num_layers': 5, 'initialization_multiplier': 0.9846919297128365}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 18 final loss: -0.00004157
Trial 19:
  Learning Rate: 0.01725338782282227
  Sigma Multiplier: 0.9863309354335646
  Initialization Multiplier: 1.0678773588044104
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.47it/s, loss=0.000469, elapsed time=0.06, total time=9.36]
[I 2025-06-07 22:06:02,827] Trial 19 finished with value: 0.00046935938102499154 and parameters: {'learning_rate': 0.01725338782282227, 'sigma_multiplier': 0.9863309354335646, 'num_layers': 4, 'initialization_multiplier': 1.0678773588044104}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 19 final loss: 0.00046936
Trial 20:
  Learning Rate: 0.0007994233129520713
  Sigma Multiplier: 0.8060537053033728
  Initialization Multiplier: 0.45259863180349713
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.15it/s, loss=0.032581, elapsed time=0.08, total time=10.8]
[I 2025-06-07 22:06:13,704] Trial 20 finished with value: 0.03258111352835142 and parameters: {'learning_rate': 0.0007994233129520713, 'sigma_multiplier': 0.8060537053033728, 'num_layers': 5, 'initialization_multiplier': 0.45259863180349713}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 20 final loss: 0.03258111
Trial 21:
  Learning Rate: 0.03833772253018618
  Sigma Multiplier: 1.6510109866164102
  Initialization Multiplier: 0.9392531220158135
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.28it/s, loss=-0.000114, elapsed time=0.05, total time=8.93]
[I 2025-06-07 22:06:22,682] Trial 21 finished with value: -0.00011368799630803551 and parameters: {'learning_rate': 0.03833772253018618, 'sigma_multiplier': 1.6510109866164102, 'num_layers': 4, 'initialization_multiplier': 0.9392531220158135}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 21 final loss: -0.00011369
Trial 22:
  Learning Rate: 0.05750034926280035
  Sigma Multiplier: 1.3083564866161552
  Initialization Multiplier: 0.5281647644481209
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.59it/s, loss=-0.000214, elapsed time=0.07, total time=9.88]
[I 2025-06-07 22:06:32,624] Trial 22 finished with value: -0.00021428751444938608 and parameters: {'learning_rate': 0.05750034926280035, 'sigma_multiplier': 1.3083564866161552, 'num_layers': 4, 'initialization_multiplier': 0.5281647644481209}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 22 final loss: -0.00021429
Trial 23:
  Learning Rate: 0.008203787386496797
  Sigma Multiplier: 1.3058717194678942
  Initialization Multiplier: 0.5419398845529613
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 16.88it/s, loss=-0.000180, elapsed time=0.04, total time=9.4] 
[I 2025-06-07 22:06:42,105] Trial 23 finished with value: -0.00017950729721892734 and parameters: {'learning_rate': 0.008203787386496797, 'sigma_multiplier': 1.3058717194678942, 'num_layers': 5, 'initialization_multiplier': 0.5419398845529613}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 23 final loss: -0.00017951
Trial 24:
  Learning Rate: 0.08789634422822785
  Sigma Multiplier: 1.071293752369165
  Initialization Multiplier: 0.3069991797589396
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 20.00it/s, loss=0.000283, elapsed time=0.04, total time=7.73]
[I 2025-06-07 22:06:49,917] Trial 24 finished with value: 0.0002826602564039448 and parameters: {'learning_rate': 0.08789634422822785, 'sigma_multiplier': 1.071293752369165, 'num_layers': 4, 'initialization_multiplier': 0.3069991797589396}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 24 final loss: 0.00028266
Trial 25:
  Learning Rate: 0.02089786561242671
  Sigma Multiplier: 1.6933696199493125
  Initialization Multiplier: 1.1654609476884543
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 21.51it/s, loss=-0.000278, elapsed time=0.04, total time=7.2] 
[I 2025-06-07 22:06:57,164] Trial 25 finished with value: -0.00027826016585099907 and parameters: {'learning_rate': 0.02089786561242671, 'sigma_multiplier': 1.6933696199493125, 'num_layers': 4, 'initialization_multiplier': 1.1654609476884543}. Best is trial 12 with value: -0.0003133227874394899.


Training has not converged after 150 steps
Trial 25 final loss: -0.00027826
Trial 26:
  Learning Rate: 0.015208316835819287
  Sigma Multiplier: 1.7386064848638172
  Initialization Multiplier: 1.1502284775750224
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 18.71it/s, loss=-0.000377, elapsed time=0.04, total time=8.23]
[I 2025-06-07 22:07:05,438] Trial 26 finished with value: -0.00037698664368775723 and parameters: {'learning_rate': 0.015208316835819287, 'sigma_multiplier': 1.7386064848638172, 'num_layers': 5, 'initialization_multiplier': 1.1502284775750224}. Best is trial 26 with value: -0.00037698664368775723.


Training has not converged after 150 steps
Trial 26 final loss: -0.00037699
Trial 27:
  Learning Rate: 0.021106451336123183
  Sigma Multiplier: 1.709815623303937
  Initialization Multiplier: 1.1681174752013497
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 19.12it/s, loss=-0.000401, elapsed time=0.12, total time=8.1] 
[I 2025-06-07 22:07:13,583] Trial 27 finished with value: -0.0004005343397201333 and parameters: {'learning_rate': 0.021106451336123183, 'sigma_multiplier': 1.709815623303937, 'num_layers': 5, 'initialization_multiplier': 1.1681174752013497}. Best is trial 27 with value: -0.0004005343397201333.


Training has not converged after 150 steps
Trial 27 final loss: -0.00040053
Trial 28:
  Learning Rate: 0.0012644712517016214
  Sigma Multiplier: 1.9899353221578642
  Initialization Multiplier: 0.9051066730507569
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 18.90it/s, loss=0.003217, elapsed time=0.04, total time=8.21]
[I 2025-06-07 22:07:21,841] Trial 28 finished with value: 0.003216917614658499 and parameters: {'learning_rate': 0.0012644712517016214, 'sigma_multiplier': 1.9899353221578642, 'num_layers': 5, 'initialization_multiplier': 0.9051066730507569}. Best is trial 27 with value: -0.0004005343397201333.


Training has not converged after 150 steps
Trial 28 final loss: 0.00321692
Trial 29:
  Learning Rate: 0.0045563940293539005
  Sigma Multiplier: 1.8058592962242597
  Initialization Multiplier: 1.282254477867797
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 18.97it/s, loss=-0.000332, elapsed time=0.04, total time=8.16]
[I 2025-06-07 22:07:30,060] Trial 29 finished with value: -0.0003321331412526002 and parameters: {'learning_rate': 0.0045563940293539005, 'sigma_multiplier': 1.8058592962242597, 'num_layers': 5, 'initialization_multiplier': 1.282254477867797}. Best is trial 27 with value: -0.0004005343397201333.


Training has not converged after 150 steps
Trial 29 final loss: -0.00033213
Trial 30:
  Learning Rate: 0.004076820101027265
  Sigma Multiplier: 1.8138303909482594
  Initialization Multiplier: 1.4549483466261603
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 18.63it/s, loss=-0.000121, elapsed time=0.04, total time=8.28]
[I 2025-06-07 22:07:38,393] Trial 30 finished with value: -0.00012065837657242618 and parameters: {'learning_rate': 0.004076820101027265, 'sigma_multiplier': 1.8138303909482594, 'num_layers': 5, 'initialization_multiplier': 1.4549483466261603}. Best is trial 27 with value: -0.0004005343397201333.


Training has not converged after 150 steps
Trial 30 final loss: -0.00012066
Trial 31:
  Learning Rate: 0.004841803196493974
  Sigma Multiplier: 1.7083833107614552
  Initialization Multiplier: 1.1473277159141926
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:18<00:00,  8.17it/s, loss=-0.000512, elapsed time=0.05, total time=18.6]
[I 2025-06-07 22:07:57,096] Trial 31 finished with value: -0.0005117636395648089 and parameters: {'learning_rate': 0.004841803196493974, 'sigma_multiplier': 1.7083833107614552, 'num_layers': 5, 'initialization_multiplier': 1.1473277159141926}. Best is trial 31 with value: -0.0005117636395648089.


Training has not converged after 150 steps
Trial 31 final loss: -0.00051176
Trial 32:
  Learning Rate: 0.011702938199907172
  Sigma Multiplier: 1.8767046559714242
  Initialization Multiplier: 1.3963044843604016
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.02it/s, loss=-0.000264, elapsed time=0.05, total time=9.34]
[I 2025-06-07 22:08:06,499] Trial 32 finished with value: -0.00026426163902990897 and parameters: {'learning_rate': 0.011702938199907172, 'sigma_multiplier': 1.8767046559714242, 'num_layers': 5, 'initialization_multiplier': 1.3963044843604016}. Best is trial 31 with value: -0.0005117636395648089.


Training has not converged after 150 steps
Trial 32 final loss: -0.00026426
Trial 33:
  Learning Rate: 0.004385328401118367
  Sigma Multiplier: 1.7463403748697206
  Initialization Multiplier: 1.1611532209901585
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.67it/s, loss=-0.000298, elapsed time=0.06, total time=8.72]
[I 2025-06-07 22:08:15,270] Trial 33 finished with value: -0.0002976632469612262 and parameters: {'learning_rate': 0.004385328401118367, 'sigma_multiplier': 1.7463403748697206, 'num_layers': 5, 'initialization_multiplier': 1.1611532209901585}. Best is trial 31 with value: -0.0005117636395648089.


Training has not converged after 150 steps
Trial 33 final loss: -0.00029766
Trial 34:
  Learning Rate: 0.022252442050367485
  Sigma Multiplier: 1.8722876810435451
  Initialization Multiplier: 1.285316454234171
  Number of Layers: 2


Training Progress: 100%|██████████| 150/150 [00:05<00:00, 26.16it/s, loss=-0.000153, elapsed time=0.03, total time=6.04]
[I 2025-06-07 22:08:21,346] Trial 34 finished with value: -0.0001533095111918868 and parameters: {'learning_rate': 0.022252442050367485, 'sigma_multiplier': 1.8722876810435451, 'num_layers': 2, 'initialization_multiplier': 1.285316454234171}. Best is trial 31 with value: -0.0005117636395648089.


Training has not converged after 150 steps
Trial 34 final loss: -0.00015331
Trial 35:
  Learning Rate: 0.00165117009981167
  Sigma Multiplier: 1.5381192375752735
  Initialization Multiplier: 1.1486966931528078
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.18it/s, loss=-0.000008, elapsed time=0.04, total time=9.01]
[I 2025-06-07 22:08:30,422] Trial 35 finished with value: -7.537186033726149e-06 and parameters: {'learning_rate': 0.00165117009981167, 'sigma_multiplier': 1.5381192375752735, 'num_layers': 5, 'initialization_multiplier': 1.1486966931528078}. Best is trial 31 with value: -0.0005117636395648089.


Training has not converged after 150 steps
Trial 35 final loss: -0.00000754
Trial 36:
  Learning Rate: 0.006066136921539601
  Sigma Multiplier: 1.7489988792851965
  Initialization Multiplier: 1.498911367336564
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 18.18it/s, loss=-0.000343, elapsed time=0.04, total time=8.47]
[I 2025-06-07 22:08:38,950] Trial 36 finished with value: -0.00034308373028931214 and parameters: {'learning_rate': 0.006066136921539601, 'sigma_multiplier': 1.7489988792851965, 'num_layers': 5, 'initialization_multiplier': 1.498911367336564}. Best is trial 31 with value: -0.0005117636395648089.


Training has not converged after 150 steps
Trial 36 final loss: -0.00034308
Trial 37:
  Learning Rate: 0.012529922603919507
  Sigma Multiplier: 1.4402562057733146
  Initialization Multiplier: 1.9680596739001786
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 16.74it/s, loss=-0.000584, elapsed time=0.07, total time=9.17]
[I 2025-06-07 22:08:48,168] Trial 37 finished with value: -0.0005842494105895364 and parameters: {'learning_rate': 0.012529922603919507, 'sigma_multiplier': 1.4402562057733146, 'num_layers': 5, 'initialization_multiplier': 1.9680596739001786}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 37 final loss: -0.00058425
Trial 38:
  Learning Rate: 0.011606287234049568
  Sigma Multiplier: 1.4440328575214068
  Initialization Multiplier: 1.9966070914676461
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 16.83it/s, loss=-0.000201, elapsed time=0.05, total time=9.22]
[I 2025-06-07 22:08:57,451] Trial 38 finished with value: -0.00020093989038575918 and parameters: {'learning_rate': 0.011606287234049568, 'sigma_multiplier': 1.4440328575214068, 'num_layers': 5, 'initialization_multiplier': 1.9966070914676461}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 38 final loss: -0.00020094
Trial 39:
  Learning Rate: 0.03701092636262711
  Sigma Multiplier: 1.3702046034300543
  Initialization Multiplier: 1.8639660365162882
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.36it/s, loss=-0.000186, elapsed time=0.06, total time=9.5] 
[I 2025-06-07 22:09:06,999] Trial 39 finished with value: -0.00018607923125758713 and parameters: {'learning_rate': 0.03701092636262711, 'sigma_multiplier': 1.3702046034300543, 'num_layers': 5, 'initialization_multiplier': 1.8639660365162882}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 39 final loss: -0.00018608
Trial 40:
  Learning Rate: 0.002656432816941807
  Sigma Multiplier: 1.5339498323923155
  Initialization Multiplier: 1.755118199220644
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 19.47it/s, loss=0.000614, elapsed time=0.05, total time=7.92]
[I 2025-06-07 22:09:14,963] Trial 40 finished with value: 0.0006140396708353135 and parameters: {'learning_rate': 0.002656432816941807, 'sigma_multiplier': 1.5339498323923155, 'num_layers': 3, 'initialization_multiplier': 1.755118199220644}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 40 final loss: 0.00061404
Trial 41:
  Learning Rate: 0.005836697760031179
  Sigma Multiplier: 1.7353641251762846
  Initialization Multiplier: 1.481219118558474
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 16.85it/s, loss=-0.000364, elapsed time=0.05, total time=9.18]
[I 2025-06-07 22:09:24,212] Trial 41 finished with value: -0.0003637576196678706 and parameters: {'learning_rate': 0.005836697760031179, 'sigma_multiplier': 1.7353641251762846, 'num_layers': 5, 'initialization_multiplier': 1.481219118558474}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 41 final loss: -0.00036376
Trial 42:
  Learning Rate: 0.014023874493731932
  Sigma Multiplier: 1.5976172354058615
  Initialization Multiplier: 1.366128283540769
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.19it/s, loss=-0.000327, elapsed time=0.06, total time=9.54]
[I 2025-06-07 22:09:33,797] Trial 42 finished with value: -0.0003267906082841856 and parameters: {'learning_rate': 0.014023874493731932, 'sigma_multiplier': 1.5976172354058615, 'num_layers': 5, 'initialization_multiplier': 1.366128283540769}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 42 final loss: -0.00032679
Trial 43:
  Learning Rate: 0.008312715741666685
  Sigma Multiplier: 1.9080493446110842
  Initialization Multiplier: 1.5510458015662814
  Number of Layers: 2


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 24.37it/s, loss=-0.000002, elapsed time=0.03, total time=6.5] 
[I 2025-06-07 22:09:40,343] Trial 43 finished with value: -2.488357184431328e-06 and parameters: {'learning_rate': 0.008312715741666685, 'sigma_multiplier': 1.9080493446110842, 'num_layers': 2, 'initialization_multiplier': 1.5510458015662814}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 43 final loss: -0.00000249
Trial 44:
  Learning Rate: 0.022942048018567127
  Sigma Multiplier: 0.1395879163440651
  Initialization Multiplier: 1.187280251668335
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:14<00:00, 10.60it/s, loss=-0.000062, elapsed time=0.09, total time=14.4]
[I 2025-06-07 22:09:54,834] Trial 44 finished with value: -6.216670074021733e-05 and parameters: {'learning_rate': 0.022942048018567127, 'sigma_multiplier': 0.1395879163440651, 'num_layers': 5, 'initialization_multiplier': 1.187280251668335}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 44 final loss: -0.00006217
Trial 45:
  Learning Rate: 0.003008110175771984
  Sigma Multiplier: 1.7395178723350015
  Initialization Multiplier: 1.9707455674416576
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.12it/s, loss=-0.000019, elapsed time=0.07, total time=10.9]
[I 2025-06-07 22:10:05,822] Trial 45 finished with value: -1.8796332659282585e-05 and parameters: {'learning_rate': 0.003008110175771984, 'sigma_multiplier': 1.7395178723350015, 'num_layers': 5, 'initialization_multiplier': 1.9707455674416576}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 45 final loss: -0.00001880
Trial 46:
  Learning Rate: 0.013209506323717325
  Sigma Multiplier: 1.6435572869351018
  Initialization Multiplier: 1.7080079788292832
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.27it/s, loss=-0.000227, elapsed time=0.05, total time=10.2]
[I 2025-06-07 22:10:16,066] Trial 46 finished with value: -0.00022723617421588574 and parameters: {'learning_rate': 0.013209506323717325, 'sigma_multiplier': 1.6435572869351018, 'num_layers': 4, 'initialization_multiplier': 1.7080079788292832}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 46 final loss: -0.00022724
Trial 47:
  Learning Rate: 0.0017801482878866623
  Sigma Multiplier: 1.4092594139588919
  Initialization Multiplier: 1.368874344593956
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:15<00:00,  9.90it/s, loss=-0.000079, elapsed time=0.11, total time=15.4]
[I 2025-06-07 22:10:31,562] Trial 47 finished with value: -7.928887704186303e-05 and parameters: {'learning_rate': 0.0017801482878866623, 'sigma_multiplier': 1.4092594139588919, 'num_layers': 5, 'initialization_multiplier': 1.368874344593956}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 47 final loss: -0.00007929
Trial 48:
  Learning Rate: 0.005396182502225106
  Sigma Multiplier: 1.9345264807844633
  Initialization Multiplier: 0.8629545442845292
  Number of Layers: 1


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 21.35it/s, loss=0.001557, elapsed time=0.04, total time=7.82]
[I 2025-06-07 22:10:39,447] Trial 48 finished with value: 0.0015573582626654235 and parameters: {'learning_rate': 0.005396182502225106, 'sigma_multiplier': 1.9345264807844633, 'num_layers': 1, 'initialization_multiplier': 0.8629545442845292}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 48 final loss: 0.00155736
Trial 49:
  Learning Rate: 0.00015521194626377227
  Sigma Multiplier: 1.6804154053586122
  Initialization Multiplier: 1.0547288841967037
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.40it/s, loss=0.039138, elapsed time=0.05, total time=10.1]
[I 2025-06-07 22:10:49,597] Trial 49 finished with value: 0.03913805529285837 and parameters: {'learning_rate': 0.00015521194626377227, 'sigma_multiplier': 1.6804154053586122, 'num_layers': 4, 'initialization_multiplier': 1.0547288841967037}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 49 final loss: 0.03913806
Trial 50:
  Learning Rate: 0.009616049035070432
  Sigma Multiplier: 1.8195576647062186
  Initialization Multiplier: 1.6203078951482002
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.26it/s, loss=-0.000349, elapsed time=0.06, total time=10.8]
[I 2025-06-07 22:11:00,546] Trial 50 finished with value: -0.00034866648873064387 and parameters: {'learning_rate': 0.009616049035070432, 'sigma_multiplier': 1.8195576647062186, 'num_layers': 5, 'initialization_multiplier': 1.6203078951482002}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 50 final loss: -0.00034867
Trial 51:
  Learning Rate: 0.010221295437447025
  Sigma Multiplier: 1.8178733776684441
  Initialization Multiplier: 1.8232957074385563
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.17it/s, loss=-0.000265, elapsed time=0.05, total time=8.99]
[I 2025-06-07 22:11:09,612] Trial 51 finished with value: -0.0002647690800080762 and parameters: {'learning_rate': 0.010221295437447025, 'sigma_multiplier': 1.8178733776684441, 'num_layers': 5, 'initialization_multiplier': 1.8232957074385563}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 51 final loss: -0.00026477
Trial 52:
  Learning Rate: 0.017554719514039353
  Sigma Multiplier: 1.5112107379752833
  Initialization Multiplier: 1.6126363039387033
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.35it/s, loss=-0.000238, elapsed time=0.05, total time=8.94]
[I 2025-06-07 22:11:18,605] Trial 52 finished with value: -0.00023828972140513526 and parameters: {'learning_rate': 0.017554719514039353, 'sigma_multiplier': 1.5112107379752833, 'num_layers': 5, 'initialization_multiplier': 1.6126363039387033}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 52 final loss: -0.00023829
Trial 53:
  Learning Rate: 0.030115520534273042
  Sigma Multiplier: 1.5860601962228582
  Initialization Multiplier: 1.5139257463660374
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.90it/s, loss=-0.000138, elapsed time=0.05, total time=8.61]
[I 2025-06-07 22:11:27,294] Trial 53 finished with value: -0.00013767265636067616 and parameters: {'learning_rate': 0.030115520534273042, 'sigma_multiplier': 1.5860601962228582, 'num_layers': 5, 'initialization_multiplier': 1.5139257463660374}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 53 final loss: -0.00013767
Trial 54:
  Learning Rate: 0.00593150156455367
  Sigma Multiplier: 1.7258788735531811
  Initialization Multiplier: 1.75161833109152
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.54it/s, loss=-0.000361, elapsed time=0.04, total time=9.86]
[I 2025-06-07 22:11:37,222] Trial 54 finished with value: -0.00036110979467653565 and parameters: {'learning_rate': 0.00593150156455367, 'sigma_multiplier': 1.7258788735531811, 'num_layers': 5, 'initialization_multiplier': 1.75161833109152}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 54 final loss: -0.00036111
Trial 55:
  Learning Rate: 0.0030631988592356987
  Sigma Multiplier: 0.6042447232026906
  Initialization Multiplier: 1.776180132750585
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:12<00:00, 12.45it/s, loss=0.003807, elapsed time=0.08, total time=12.3]
[I 2025-06-07 22:11:49,580] Trial 55 finished with value: 0.003806970209396945 and parameters: {'learning_rate': 0.0030631988592356987, 'sigma_multiplier': 0.6042447232026906, 'num_layers': 5, 'initialization_multiplier': 1.776180132750585}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 55 final loss: 0.00380697
Trial 56:
  Learning Rate: 0.006875370866277081
  Sigma Multiplier: 1.69515320797615
  Initialization Multiplier: 1.928044722537964
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.10it/s, loss=-0.000447, elapsed time=0.06, total time=9.03]
[I 2025-06-07 22:11:58,658] Trial 56 finished with value: -0.00044674874153465173 and parameters: {'learning_rate': 0.006875370866277081, 'sigma_multiplier': 1.69515320797615, 'num_layers': 4, 'initialization_multiplier': 1.928044722537964}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 56 final loss: -0.00044675
Trial 57:
  Learning Rate: 0.01676448348888097
  Sigma Multiplier: 1.1991327301113057
  Initialization Multiplier: 1.8948471905097661
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.61it/s, loss=-0.000044, elapsed time=0.05, total time=9.89]
[I 2025-06-07 22:12:08,593] Trial 57 finished with value: -4.37452225348326e-05 and parameters: {'learning_rate': 0.01676448348888097, 'sigma_multiplier': 1.1991327301113057, 'num_layers': 4, 'initialization_multiplier': 1.8948471905097661}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 57 final loss: -0.00004375
Trial 58:
  Learning Rate: 0.04279578306584678
  Sigma Multiplier: 1.3767473255944895
  Initialization Multiplier: 1.2192655366228982
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.90it/s, loss=-0.000196, elapsed time=0.05, total time=8.64]
[I 2025-06-07 22:12:17,280] Trial 58 finished with value: -0.0001956983824431428 and parameters: {'learning_rate': 0.04279578306584678, 'sigma_multiplier': 1.3767473255944895, 'num_layers': 3, 'initialization_multiplier': 1.2192655366228982}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 58 final loss: -0.00019570
Trial 59:
  Learning Rate: 0.0020459369591399896
  Sigma Multiplier: 1.9554975907565622
  Initialization Multiplier: 1.9398291060906745
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 18.41it/s, loss=0.000014, elapsed time=0.04, total time=8.43]
[I 2025-06-07 22:12:25,762] Trial 59 finished with value: 1.4350127632982684e-05 and parameters: {'learning_rate': 0.0020459369591399896, 'sigma_multiplier': 1.9554975907565622, 'num_layers': 4, 'initialization_multiplier': 1.9398291060906745}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 59 final loss: 0.00001435
Trial 60:
  Learning Rate: 0.0011082109316928029
  Sigma Multiplier: 1.591705871523518
  Initialization Multiplier: 1.0838383940937213
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 16.74it/s, loss=0.013458, elapsed time=0.06, total time=9.25]
[I 2025-06-07 22:12:35,065] Trial 60 finished with value: 0.013458091886481054 and parameters: {'learning_rate': 0.0011082109316928029, 'sigma_multiplier': 1.591705871523518, 'num_layers': 4, 'initialization_multiplier': 1.0838383940937213}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 60 final loss: 0.01345809
Trial 61:
  Learning Rate: 0.006442010308651362
  Sigma Multiplier: 1.7149037729846885
  Initialization Multiplier: 1.6913161263982601
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.86it/s, loss=-0.000182, elapsed time=0.05, total time=10.3]
[I 2025-06-07 22:12:45,465] Trial 61 finished with value: -0.0001816301140638193 and parameters: {'learning_rate': 0.006442010308651362, 'sigma_multiplier': 1.7149037729846885, 'num_layers': 5, 'initialization_multiplier': 1.6913161263982601}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 61 final loss: -0.00018163
Trial 62:
  Learning Rate: 0.0035065536295566403
  Sigma Multiplier: 1.6738622220472998
  Initialization Multiplier: 1.849347520949663
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.48it/s, loss=-0.000333, elapsed time=0.05, total time=9.98]
[I 2025-06-07 22:12:55,500] Trial 62 finished with value: -0.00033289724128203533 and parameters: {'learning_rate': 0.0035065536295566403, 'sigma_multiplier': 1.6738622220472998, 'num_layers': 5, 'initialization_multiplier': 1.849347520949663}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 62 final loss: -0.00033290
Trial 63:
  Learning Rate: 0.0052358613521128325
  Sigma Multiplier: 1.4802531236638112
  Initialization Multiplier: 1.7005351334039895
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.92it/s, loss=-0.000111, elapsed time=0.05, total time=10.3]
[I 2025-06-07 22:13:05,886] Trial 63 finished with value: -0.00011060045178605772 and parameters: {'learning_rate': 0.0052358613521128325, 'sigma_multiplier': 1.4802531236638112, 'num_layers': 5, 'initialization_multiplier': 1.7005351334039895}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 63 final loss: -0.00011060
Trial 64:
  Learning Rate: 0.006879556774207171
  Sigma Multiplier: 1.842994588086008
  Initialization Multiplier: 1.935937494154895
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.98it/s, loss=-0.000372, elapsed time=0.06, total time=10.3]
[I 2025-06-07 22:13:16,291] Trial 64 finished with value: -0.0003715943664891626 and parameters: {'learning_rate': 0.006879556774207171, 'sigma_multiplier': 1.842994588086008, 'num_layers': 5, 'initialization_multiplier': 1.935937494154895}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 64 final loss: -0.00037159
Trial 65:
  Learning Rate: 0.008104311661842313
  Sigma Multiplier: 1.7803791930602377
  Initialization Multiplier: 0.9843848303763698
  Number of Layers: 3


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 18.91it/s, loss=-0.000285, elapsed time=0.04, total time=8.24]
[I 2025-06-07 22:13:24,578] Trial 65 finished with value: -0.00028478431775125234 and parameters: {'learning_rate': 0.008104311661842313, 'sigma_multiplier': 1.7803791930602377, 'num_layers': 3, 'initialization_multiplier': 0.9843848303763698}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 65 final loss: -0.00028478
Trial 66:
  Learning Rate: 0.026547241743484242
  Sigma Multiplier: 1.9071632887479704
  Initialization Multiplier: 1.909508835598454
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.77it/s, loss=-0.000264, elapsed time=0.06, total time=10.4]
[I 2025-06-07 22:13:35,065] Trial 66 finished with value: -0.0002636795266488511 and parameters: {'learning_rate': 0.026547241743484242, 'sigma_multiplier': 1.9071632887479704, 'num_layers': 5, 'initialization_multiplier': 1.909508835598454}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 66 final loss: -0.00026368
Trial 67:
  Learning Rate: 0.010055232242945812
  Sigma Multiplier: 1.8299347184860522
  Initialization Multiplier: 1.9988210023225599
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.19it/s, loss=-0.000135, elapsed time=0.05, total time=9.51]
[I 2025-06-07 22:13:44,631] Trial 67 finished with value: -0.00013462536200789817 and parameters: {'learning_rate': 0.010055232242945812, 'sigma_multiplier': 1.8299347184860522, 'num_layers': 4, 'initialization_multiplier': 1.9988210023225599}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 67 final loss: -0.00013463
Trial 68:
  Learning Rate: 0.01556353582494675
  Sigma Multiplier: 1.6323530945831817
  Initialization Multiplier: 1.3043550900653806
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.63it/s, loss=-0.000378, elapsed time=0.05, total time=10.6]
[I 2025-06-07 22:13:55,297] Trial 68 finished with value: -0.0003784896974287022 and parameters: {'learning_rate': 0.01556353582494675, 'sigma_multiplier': 1.6323530945831817, 'num_layers': 5, 'initialization_multiplier': 1.3043550900653806}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 68 final loss: -0.00037849
Trial 69:
  Learning Rate: 0.016710637374099255
  Sigma Multiplier: 1.6408752786979435
  Initialization Multiplier: 1.3410459360266822
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.96it/s, loss=-0.000302, elapsed time=0.06, total time=10.3]
[I 2025-06-07 22:14:05,672] Trial 69 finished with value: -0.0003016749137453978 and parameters: {'learning_rate': 0.016710637374099255, 'sigma_multiplier': 1.6408752786979435, 'num_layers': 5, 'initialization_multiplier': 1.3410459360266822}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 69 final loss: -0.00030167
Trial 70:
  Learning Rate: 0.020753177878291496
  Sigma Multiplier: 1.998030728683398
  Initialization Multiplier: 1.090385840112616
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.01it/s, loss=-0.000279, elapsed time=0.05, total time=9.11]
[I 2025-06-07 22:14:14,834] Trial 70 finished with value: -0.00027903154917907576 and parameters: {'learning_rate': 0.020753177878291496, 'sigma_multiplier': 1.998030728683398, 'num_layers': 4, 'initialization_multiplier': 1.090385840112616}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 70 final loss: -0.00027903
Trial 71:
  Learning Rate: 0.014161274287033836
  Sigma Multiplier: 1.8492370095940618
  Initialization Multiplier: 1.1245266421492515
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.50it/s, loss=-0.000201, elapsed time=0.06, total time=9.99]
[I 2025-06-07 22:14:24,885] Trial 71 finished with value: -0.0002013521905447555 and parameters: {'learning_rate': 0.014161274287033836, 'sigma_multiplier': 1.8492370095940618, 'num_layers': 5, 'initialization_multiplier': 1.1245266421492515}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 71 final loss: -0.00020135
Trial 72:
  Learning Rate: 0.00785107318624881
  Sigma Multiplier: 1.7802135954777059
  Initialization Multiplier: 1.2562206238457971
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.12it/s, loss=-0.000320, elapsed time=0.04, total time=10.3]
[I 2025-06-07 22:14:35,214] Trial 72 finished with value: -0.0003202161937645119 and parameters: {'learning_rate': 0.00785107318624881, 'sigma_multiplier': 1.7802135954777059, 'num_layers': 5, 'initialization_multiplier': 1.2562206238457971}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 72 final loss: -0.00032022
Trial 73:
  Learning Rate: 3.111819087882262e-05
  Sigma Multiplier: 1.58373247951347
  Initialization Multiplier: 1.3112150657041495
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.47it/s, loss=0.057523, elapsed time=0.06, total time=10.1]
[I 2025-06-07 22:14:45,314] Trial 73 finished with value: 0.0575231600276218 and parameters: {'learning_rate': 3.111819087882262e-05, 'sigma_multiplier': 1.58373247951347, 'num_layers': 5, 'initialization_multiplier': 1.3112150657041495}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 73 final loss: 0.05752316
Trial 74:
  Learning Rate: 0.004205244706125702
  Sigma Multiplier: 1.695556933868408
  Initialization Multiplier: 1.2229493526995687
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.58it/s, loss=0.001210, elapsed time=0.05, total time=9.94]
[I 2025-06-07 22:14:55,314] Trial 74 finished with value: 0.00120977601224497 and parameters: {'learning_rate': 0.004205244706125702, 'sigma_multiplier': 1.695556933868408, 'num_layers': 5, 'initialization_multiplier': 1.2229493526995687}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 74 final loss: 0.00120978
Trial 75:
  Learning Rate: 0.012360604420595691
  Sigma Multiplier: 1.7723446306418216
  Initialization Multiplier: 0.9805830995861233
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.07it/s, loss=-0.000154, elapsed time=0.05, total time=10.2]
[I 2025-06-07 22:15:05,591] Trial 75 finished with value: -0.00015445581484523757 and parameters: {'learning_rate': 0.012360604420595691, 'sigma_multiplier': 1.7723446306418216, 'num_layers': 5, 'initialization_multiplier': 0.9805830995861233}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 75 final loss: -0.00015446
Trial 76:
  Learning Rate: 0.007173932750605358
  Sigma Multiplier: 0.8907279456263817
  Initialization Multiplier: 1.4522336119886257
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 13.96it/s, loss=0.000609, elapsed time=0.06, total time=11]  
[I 2025-06-07 22:15:16,669] Trial 76 finished with value: 0.0006086811753909946 and parameters: {'learning_rate': 0.007173932750605358, 'sigma_multiplier': 0.8907279456263817, 'num_layers': 5, 'initialization_multiplier': 1.4522336119886257}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 76 final loss: 0.00060868
Trial 77:
  Learning Rate: 0.025545241216651533
  Sigma Multiplier: 1.5356667874723395
  Initialization Multiplier: 1.4451632157410044
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.30it/s, loss=-0.000251, elapsed time=0.07, total time=10.1]
[I 2025-06-07 22:15:26,851] Trial 77 finished with value: -0.00025080279709363985 and parameters: {'learning_rate': 0.025545241216651533, 'sigma_multiplier': 1.5356667874723395, 'num_layers': 5, 'initialization_multiplier': 1.4451632157410044}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 77 final loss: -0.00025080
Trial 78:
  Learning Rate: 0.037893661562045926
  Sigma Multiplier: 1.6311274718730533
  Initialization Multiplier: 1.7916116660048513
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.61it/s, loss=-0.000284, elapsed time=0.04, total time=9.99]
[I 2025-06-07 22:15:36,905] Trial 78 finished with value: -0.0002842614376090371 and parameters: {'learning_rate': 0.037893661562045926, 'sigma_multiplier': 1.6311274718730533, 'num_layers': 5, 'initialization_multiplier': 1.7916116660048513}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 78 final loss: -0.00028426
Trial 79:
  Learning Rate: 0.005179243589698433
  Sigma Multiplier: 1.447678198987766
  Initialization Multiplier: 0.8429464411494934
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.59it/s, loss=0.004078, elapsed time=0.06, total time=9.88]
[I 2025-06-07 22:15:46,831] Trial 79 finished with value: 0.0040779257162024286 and parameters: {'learning_rate': 0.005179243589698433, 'sigma_multiplier': 1.447678198987766, 'num_layers': 5, 'initialization_multiplier': 0.8429464411494934}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 79 final loss: 0.00407793
Trial 80:
  Learning Rate: 0.01799804226617657
  Sigma Multiplier: 1.869696694956377
  Initialization Multiplier: 1.1204819871974334
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.57it/s, loss=-0.000183, elapsed time=0.05, total time=9.38]
[I 2025-06-07 22:15:56,261] Trial 80 finished with value: -0.00018287121724193213 and parameters: {'learning_rate': 0.01799804226617657, 'sigma_multiplier': 1.869696694956377, 'num_layers': 4, 'initialization_multiplier': 1.1204819871974334}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 80 final loss: -0.00018287
Trial 81:
  Learning Rate: 0.00935395773813779
  Sigma Multiplier: 1.7095327982656938
  Initialization Multiplier: 1.9360621267100127
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.02it/s, loss=-0.000208, elapsed time=0.05, total time=10.3]
[I 2025-06-07 22:16:06,648] Trial 81 finished with value: -0.00020847758187596542 and parameters: {'learning_rate': 0.00935395773813779, 'sigma_multiplier': 1.7095327982656938, 'num_layers': 5, 'initialization_multiplier': 1.9360621267100127}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 81 final loss: -0.00020848
Trial 82:
  Learning Rate: 0.005970328480375231
  Sigma Multiplier: 1.735390213107322
  Initialization Multiplier: 1.8791293519073022
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:10<00:00, 14.97it/s, loss=-0.000116, elapsed time=0.06, total time=10.4]
[I 2025-06-07 22:16:17,105] Trial 82 finished with value: -0.00011644263630474374 and parameters: {'learning_rate': 0.005970328480375231, 'sigma_multiplier': 1.735390213107322, 'num_layers': 5, 'initialization_multiplier': 1.8791293519073022}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 82 final loss: -0.00011644
Trial 83:
  Learning Rate: 0.0037024512697230354
  Sigma Multiplier: 1.659949881504735
  Initialization Multiplier: 1.74240266744932
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 16.01it/s, loss=-0.000043, elapsed time=0.04, total time=9.64]
[I 2025-06-07 22:16:26,800] Trial 83 finished with value: -4.271591523588522e-05 and parameters: {'learning_rate': 0.0037024512697230354, 'sigma_multiplier': 1.659949881504735, 'num_layers': 5, 'initialization_multiplier': 1.74240266744932}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 83 final loss: -0.00004272
Trial 84:
  Learning Rate: 0.0022766641662732025
  Sigma Multiplier: 1.5637096263336208
  Initialization Multiplier: 0.061610004381664085
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.22it/s, loss=0.000056, elapsed time=0.05, total time=10.1] 
[I 2025-06-07 22:16:36,952] Trial 84 finished with value: 5.551126637697755e-05 and parameters: {'learning_rate': 0.0022766641662732025, 'sigma_multiplier': 1.5637096263336208, 'num_layers': 5, 'initialization_multiplier': 0.061610004381664085}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 84 final loss: 0.00005551
Trial 85:
  Learning Rate: 0.006847105783113455
  Sigma Multiplier: 1.946310001382183
  Initialization Multiplier: 1.659025920856826
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.09it/s, loss=-0.000195, elapsed time=0.08, total time=10.2]
[I 2025-06-07 22:16:47,207] Trial 85 finished with value: -0.00019480849924726244 and parameters: {'learning_rate': 0.006847105783113455, 'sigma_multiplier': 1.946310001382183, 'num_layers': 5, 'initialization_multiplier': 1.659025920856826}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 85 final loss: -0.00019481
Trial 86:
  Learning Rate: 0.011333197531916332
  Sigma Multiplier: 1.7593152222219806
  Initialization Multiplier: 1.5653104592186808
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.06it/s, loss=-0.000292, elapsed time=0.08, total time=10.2]
[I 2025-06-07 22:16:57,476] Trial 86 finished with value: -0.00029210693510890886 and parameters: {'learning_rate': 0.011333197531916332, 'sigma_multiplier': 1.7593152222219806, 'num_layers': 5, 'initialization_multiplier': 1.5653104592186808}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 86 final loss: -0.00029211
Trial 87:
  Learning Rate: 0.01460866177072218
  Sigma Multiplier: 1.8546197752710856
  Initialization Multiplier: 1.8360682485005075
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.08it/s, loss=-0.000210, elapsed time=0.06, total time=10.3]
[I 2025-06-07 22:17:07,804] Trial 87 finished with value: -0.00021017903000380102 and parameters: {'learning_rate': 0.01460866177072218, 'sigma_multiplier': 1.8546197752710856, 'num_layers': 5, 'initialization_multiplier': 1.8360682485005075}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 87 final loss: -0.00021018
Trial 88:
  Learning Rate: 0.008839402113420549
  Sigma Multiplier: 1.6185802014218522
  Initialization Multiplier: 1.0377774729905334
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.32it/s, loss=-0.000109, elapsed time=0.06, total time=10]  
[I 2025-06-07 22:17:17,896] Trial 88 finished with value: -0.00010940208829397597 and parameters: {'learning_rate': 0.008839402113420549, 'sigma_multiplier': 1.6185802014218522, 'num_layers': 5, 'initialization_multiplier': 1.0377774729905334}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 88 final loss: -0.00010940
Trial 89:
  Learning Rate: 0.003061880812862843
  Sigma Multiplier: 1.4973153299765996
  Initialization Multiplier: 1.962186946139384
  Number of Layers: 2


Training Progress: 100%|██████████| 150/150 [00:06<00:00, 22.33it/s, loss=0.009076, elapsed time=0.07, total time=6.99]
[I 2025-06-07 22:17:24,927] Trial 89 finished with value: 0.009076494783371853 and parameters: {'learning_rate': 0.003061880812862843, 'sigma_multiplier': 1.4973153299765996, 'num_layers': 2, 'initialization_multiplier': 1.962186946139384}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 89 final loss: 0.00907649
Trial 90:
  Learning Rate: 0.005233344187450868
  Sigma Multiplier: 0.338549680935055
  Initialization Multiplier: 1.4108007670200298
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:13<00:00, 11.29it/s, loss=0.002600, elapsed time=0.08, total time=13.6]
[I 2025-06-07 22:17:38,543] Trial 90 finished with value: 0.0026001362244346695 and parameters: {'learning_rate': 0.005233344187450868, 'sigma_multiplier': 0.338549680935055, 'num_layers': 5, 'initialization_multiplier': 1.4108007670200298}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 90 final loss: 0.00260014
Trial 91:
  Learning Rate: 0.010292092154055426
  Sigma Multiplier: 1.8079910055272683
  Initialization Multiplier: 1.5069444319463874
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:09<00:00, 15.86it/s, loss=-0.000294, elapsed time=0.05, total time=9.74]
[I 2025-06-07 22:17:48,338] Trial 91 finished with value: -0.000293862383262655 and parameters: {'learning_rate': 0.010292092154055426, 'sigma_multiplier': 1.8079910055272683, 'num_layers': 5, 'initialization_multiplier': 1.5069444319463874}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 91 final loss: -0.00029386
Trial 92:
  Learning Rate: 0.0194437819874175
  Sigma Multiplier: 1.7176047353496346
  Initialization Multiplier: 1.6211645381378188
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 17.51it/s, loss=-0.000168, elapsed time=0.04, total time=8.87]
[I 2025-06-07 22:17:57,255] Trial 92 finished with value: -0.00016789059299597532 and parameters: {'learning_rate': 0.0194437819874175, 'sigma_multiplier': 1.7176047353496346, 'num_layers': 5, 'initialization_multiplier': 1.6211645381378188}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 92 final loss: -0.00016789
Trial 93:
  Learning Rate: 0.01496360529658561
  Sigma Multiplier: 1.9066069024835979
  Initialization Multiplier: 1.212010380558872
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 20.02it/s, loss=-0.000396, elapsed time=0.05, total time=7.74]
[I 2025-06-07 22:18:05,076] Trial 93 finished with value: -0.0003955664034844372 and parameters: {'learning_rate': 0.01496360529658561, 'sigma_multiplier': 1.9066069024835979, 'num_layers': 5, 'initialization_multiplier': 1.212010380558872}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 93 final loss: -0.00039557
Trial 94:
  Learning Rate: 0.031700896748372204
  Sigma Multiplier: 1.9322530521031993
  Initialization Multiplier: 1.1805464259438363
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 21.26it/s, loss=-0.000209, elapsed time=0.05, total time=7.28]
[I 2025-06-07 22:18:12,414] Trial 94 finished with value: -0.00020856526813746608 and parameters: {'learning_rate': 0.031700896748372204, 'sigma_multiplier': 1.9322530521031993, 'num_layers': 5, 'initialization_multiplier': 1.1805464259438363}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 94 final loss: -0.00020857
Trial 95:
  Learning Rate: 0.01518199254419617
  Sigma Multiplier: 1.8922927344055653
  Initialization Multiplier: 1.3340080418830602
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 19.39it/s, loss=-0.000180, elapsed time=0.05, total time=7.99]
[I 2025-06-07 22:18:20,453] Trial 95 finished with value: -0.00017963553966033217 and parameters: {'learning_rate': 0.01518199254419617, 'sigma_multiplier': 1.8922927344055653, 'num_layers': 5, 'initialization_multiplier': 1.3340080418830602}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 95 final loss: -0.00017964
Trial 96:
  Learning Rate: 0.04577754279697202
  Sigma Multiplier: 1.6788621801292047
  Initialization Multiplier: 1.264583366182922
  Number of Layers: 4


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 20.24it/s, loss=-0.000225, elapsed time=0.04, total time=7.64]
[I 2025-06-07 22:18:28,136] Trial 96 finished with value: -0.00022525856455140898 and parameters: {'learning_rate': 0.04577754279697202, 'sigma_multiplier': 1.6788621801292047, 'num_layers': 4, 'initialization_multiplier': 1.264583366182922}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 96 final loss: -0.00022526
Trial 97:
  Learning Rate: 0.07112085518583944
  Sigma Multiplier: 1.7910397233665916
  Initialization Multiplier: 1.9171034270232459
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 18.81it/s, loss=-0.000074, elapsed time=0.06, total time=8.22]
[I 2025-06-07 22:18:36,430] Trial 97 finished with value: -7.423620188887881e-05 and parameters: {'learning_rate': 0.07112085518583944, 'sigma_multiplier': 1.7910397233665916, 'num_layers': 5, 'initialization_multiplier': 1.9171034270232459}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 97 final loss: -0.00007424
Trial 98:
  Learning Rate: 0.012753772325256147
  Sigma Multiplier: 1.8427960823750733
  Initialization Multiplier: 1.1920639091870442
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:08<00:00, 18.14it/s, loss=-0.000380, elapsed time=0.05, total time=8.54]
[I 2025-06-07 22:18:45,018] Trial 98 finished with value: -0.00037953682128703787 and parameters: {'learning_rate': 0.012753772325256147, 'sigma_multiplier': 1.8427960823750733, 'num_layers': 5, 'initialization_multiplier': 1.1920639091870442}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 98 final loss: -0.00037954
Trial 99:
  Learning Rate: 0.0242490421154761
  Sigma Multiplier: 1.8297819909944701
  Initialization Multiplier: 1.2113810527126294
  Number of Layers: 5


Training Progress: 100%|██████████| 150/150 [00:07<00:00, 19.74it/s, loss=-0.000193, elapsed time=0.05, total time=7.85]
[I 2025-06-07 22:18:52,930] Trial 99 finished with value: -0.0001930098887073218 and parameters: {'learning_rate': 0.0242490421154761, 'sigma_multiplier': 1.8297819909944701, 'num_layers': 5, 'initialization_multiplier': 1.2113810527126294}. Best is trial 37 with value: -0.0005842494105895364.


Training has not converged after 150 steps
Trial 99 final loss: -0.00019301


In [33]:
# Pull the winning configuration and its objective value out of the finished study.
best_hyperparams, best_loss_value = study.best_params, study.best_value

# Report the outcome of the search.
print("\nOptimization Finished!")
print(f"Best hyperparameters found: {best_hyperparams}")
print(f"Best loss value: {best_loss_value}")


Optimization Finished!
Best hyperparameters found: {'learning_rate': 0.012529922603919507, 'sigma_multiplier': 1.4402562057733146, 'num_layers': 5, 'initialization_multiplier': 1.9680596739001786}
Best loss value: -0.0005842494105895364


In [34]:
# Unpack the tuned hyperparameters into module-level constants used by the final training run.
# NOTE(review): this rebinds NUM_LAYERS, which was already set in the configuration cell.
LR, SIGMA_M, NUM_LAYERS, INIT_M = (
    best_hyperparams[name]
    for name in (
        'learning_rate',
        'sigma_multiplier',
        'num_layers',
        'initialization_multiplier',
    )
)

In [35]:
def train_on_dataset(dataset=train_ds, *, n_iters=2000, n_ops=2000, n_samples=2000, seed=42):
    """Train an IQP circuit on ``dataset`` with the tuned hyperparameters.

    The circuit layout and optimizer settings are read from the notebook-level
    constants ``NODES``, ``NUM_LAYERS``, ``INIT_M``, ``SIGMA_M`` and ``LR``.

    Args:
        dataset: Training samples passed to ``initialize_from_data``,
            ``median_heuristic`` and the loss as ``ground_truth``.
            Defaults to the ``train_ds`` object bound when this cell was run.
        n_iters: Number of optimizer iterations passed to ``Trainer.train``.
        n_ops: Forwarded to the MMD loss as ``n_ops``.
        n_samples: Forwarded to the MMD loss as ``n_samples``.
        seed: Integer seed for the JAX PRNG key handed to the loss.

    Returns:
        The trainer's ``final_params`` after training.
    """
    # presumably one qubit per possible edge of a NODES-node graph — TODO confirm
    num_qubits = NODES * (NODES - 1) // 2
    gates = efficient_connectivity_gates(aachen_connectivity(), num_qubits, NUM_LAYERS)
    circuit = iqp.IqpSimulator(num_qubits, gates, device="lightning.qubit")

    loss_kwargs = {
        # Data-driven initial parameters, rescaled by the tuned multiplier.
        "params": initialize_from_data(gates, dataset) * INIT_M,
        "iqp_circuit": circuit,
        "ground_truth": dataset,
        # Kernel bandwidth: median heuristic rescaled by the tuned multiplier,
        # wrapped in a list as in the original call.
        "sigma": [median_heuristic(dataset) * SIGMA_M],
        "n_ops": n_ops,
        "n_samples": n_samples,
        "key": jax.random.PRNGKey(seed),
    }

    trainer = iqp.Trainer("Adam", iqp.gen_qml.mmd_loss_iqp, stepsize=LR)
    trainer.train(n_iters=n_iters, loss_kwargs=loss_kwargs, turbo=1)

    return trainer.final_params

In [36]:
# Final training run on the full training set with the tuned hyperparameters.
params = train_on_dataset(dataset=train_ds)

Training Progress: 100%|██████████| 2000/2000 [01:41<00:00, 19.76it/s, loss=-0.000174, elapsed time=0.04, total time=101] 

Training has not converged after 2000 steps





In [37]:
import numpy as np

# Persist the trained parameters. The file name encodes the dataset and the tuned
# hyperparameters; the layer count is labelled NUMLAYERS so the file written here
# matches the path displayed in the following cell (it was previously mislabelled
# MAX_WEIGHT, so the reported path did not exist on disk).
params_path = (
    f'./results/params/params_{NODES}N_{TYPE}_{CONN}'
    f'_LR{LR}_SIGMA{SIGMA_M}_INIT{INIT_M}_NUMLAYERS{NUM_LAYERS}.npy'
)
np.save(params_path, params)

In [38]:
# Show the parameter-file path for this configuration as the cell output.
(
    f'./results/params/params_{NODES}N_{TYPE}_{CONN}'
    f'_LR{LR}_SIGMA{SIGMA_M}_INIT{INIT_M}_NUMLAYERS{NUM_LAYERS}.npy'
)

'./results/params/params_8N_Bipartite_Medium_LR0.012529922603919507_SIGMA1.4402562057733146_INIT1.9680596739001786_NUMLAYERS5.npy'