From b78e36ce6c88ba0369714a0d5ada03491708c5a7 Mon Sep 17 00:00:00 2001 From: Ruoyu Gao Date: Tue, 20 Jun 2023 00:57:57 -0400 Subject: [PATCH] fix style for icm --- ding/reward_model/icm_reward_model.py | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/ding/reward_model/icm_reward_model.py b/ding/reward_model/icm_reward_model.py index f277791bb6..d988a1aed5 100644 --- a/ding/reward_model/icm_reward_model.py +++ b/ding/reward_model/icm_reward_model.py @@ -51,11 +51,11 @@ class ICMRewardModel(BaseRewardModel): 7 | ``residual_num`` int 4 | the residual number of residual net | 8 | ``hidden`` list [64, 64, | the MLP layer shape | | ``_size_list`` (int) 128] | | - 9 | ``inverse_`` int 512 | the inverse model hidden size | + 9 | ``inverse_`` int 512 | the inverse model hidden size | | ``hidden_size`` | | - 10 | ``update_per_`` int 100 | Number of updates per collect | + 10 | ``update_per_`` int 100 | Number of updates per collect | | ``collect`` | | - 11 | ``reverse_loss`` float 1 | the importance weight of the | + 11 | ``reverse_loss`` float 1 | the importance weight of the | ``_weight`` | forward and reverse loss | 12 | ``intrinsic_`` float 0.003 | the weight of intrinsic reward | r = w*r_i + r_e ``reward_weight``