diff --git a/python/ppo.py b/python/ppo.py index f755f96fdb..8a4a879e40 100755 --- a/python/ppo.py +++ b/python/ppo.py @@ -32,6 +32,7 @@ --hidden-units= Number of units in hidden layer [default: 64]. --batch-size= How many experiences per gradient descent update step [default: 64]. --keep-checkpoints= How many model checkpoints to keep [default: 5]. + --worker-id= Number to add to communication port (5005). Used for asynchronous agent scenarios [default: 0]. ''' options = docopt(_USAGE) @@ -47,6 +48,7 @@ save_freq = int(options['--save-freq']) env_name = options[''] keep_checkpoints = int(options['--keep-checkpoints']) +worker_id = int(options['--worker-id']) # Algorithm-specific parameters for tuning gamma = float(options['--gamma']) @@ -60,7 +62,7 @@ hidden_units = int(options['--hidden-units']) batch_size = int(options['--batch-size']) -env = UnityEnvironment(file_name=env_name) +env = UnityEnvironment(file_name=env_name, worker_id=worker_id) print(str(env)) brain_name = env.brain_names[0]