attention network work

ADGEfficiency · Jun 3, 2021 · d3a7752 · d3a7752
1 parent fb6973b
commit d3a7752
Show file tree

Hide file tree

Showing 2 changed files with 38 additions and 3 deletions.
diff --git a/energypy/agent/qfunc.py b/energypy/agent/qfunc.py
@@ -38,9 +38,9 @@ def make_qfunc(obs_shape, n_actions, name, size_scale=1):
     # if hyp.get('q-net') == 'attention':
     # TODO
     if False:
-        inputs, net = attention(obs_shape, 1, size_scale)
+        _, net = attention(obs_shape, 1, size_scale)
     else:
-        inputs, net = dense(inputs, 1, size_scale)
+        _, net = dense(inputs, 1, size_scale)
 
     return keras.Model(
         inputs=[in_obs, in_act],

diff --git a/energypy/train.py b/energypy/train.py
@@ -1,7 +1,14 @@
 from energypy import utils, qfunc, policy, target, alpha
 
 
-def train(
+def train(*args, **kwargs):
+    if 'network' in kwargs.keys():
+        raise NotImplementedError()
+    else:
+        return train_one_head_network(*args, **kwargs)
+
+
+def train_one_head_network(
     batch,
     actor,
     onlines,
@@ -61,3 +68,31 @@ def train(
     counters['alpha-update-seconds'] += utils.now() - st
     counters['train-seconds'] += utils.now() - st
     counters['train-steps'] += 1
+
+
+def train_multi_head_network(
+    batch,
+    network,
+    log_alpha,
+    writer,
+    optimizers,
+    counters,
+    hyp
+):
+    st = utils.now()
+    #  TODO: train the multi-head network here (step not implemented yet)
+
+
+
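+    #  TODO: maybe do the actor fwd pass here - NOTE(review): `actor` (used below) is not a parameter of this function; confirm where it should come from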
+    st = utils.now()
+    alpha.update(
+        batch,
+        actor,
+        log_alpha,
+        hyp,
+        optimizers['alpha'],
+        counters,
+        writer
+    )
+    counters['alpha-update-seconds'] += utils.now() - st