diff --git a/reinforcement_learning/reinforce.py b/reinforcement_learning/reinforce.py index 8c8ff485f6..77a733c702 100644 --- a/reinforcement_learning/reinforce.py +++ b/reinforcement_learning/reinforce.py @@ -15,10 +15,10 @@ parser.add_argument('--gamma', type=float, default=0.99, metavar='G', help='discount factor (default: 0.99)') parser.add_argument('--seed', type=int, default=543, metavar='N', - help='random seed (default: 1)') + help='random seed (default: 543)') parser.add_argument('--render', action='store_true', help='render the environment') -parser.add_argument('--log-interval', type=int, default=10, metavar='N', +parser.add_argument('--log_interval', type=int, default=10, metavar='N', help='interval between training status logs (default: 10)') args = parser.parse_args() @@ -57,7 +57,6 @@ def select_action(state): def finish_episode(): R = 0 - saved_actions = model.saved_actions rewards = [] for r in model.rewards[::-1]: R = r + args.gamma * R