In [1]:
def make_env(scenario_name, benchmark=False):
    '''
    Build a MultiAgentEnv for the named scenario and return it as env.

    The returned object can be used much like a gym environment: call
    env.reset() and env.step() to run it, and env.render() to view the
    environment on the screen.

    Input:
        scenario_name   :   name of the scenario script in ./scenarios/ to
                            load (without the .py extension)
        benchmark       :   whether you want to produce benchmarking data
                            (usually only done during evaluation); when true,
                            scenario.benchmark_data is passed to the
                            environment as an extra argument

    Some useful env properties (see environment.py):
        .observation_space  :   Returns the observation space for each agent
        .action_space       :   Returns the action space for each agent
        .n                  :   Returns the number of Agents
    '''
    # Imports are function-local, so the multiagent package is only needed
    # when make_env is actually called.
    from multiagent.environment import MultiAgentEnv
    import multiagent.scenarios as scenarios

    # Load the scenario script and instantiate its Scenario class.
    scenario_module = scenarios.load(scenario_name + ".py")
    scenario = scenario_module.Scenario()

    # Let the scenario build the world the environment will wrap.
    world = scenario.make_world()

    # Callbacks passed in every case, in the positional order the
    # environment constructor receives them.
    callbacks = [scenario.reset_world, scenario.reward, scenario.observation]
    if benchmark:
        # Looked up only on this branch, so a scenario without
        # benchmark_data is still usable when benchmark is false.
        callbacks.append(scenario.benchmark_data)

    return MultiAgentEnv(world, *callbacks)

In [2]:
# Build the environment for the "simple_push" scenario; benchmark keeps its default of False.
env = make_env("simple_push")

In [3]:
# Reset the environment; the displayed result is a list of observation arrays
# (two here, with 8 and 19 entries).
env.reset()

[array([ 0.        ,  0.        ,  0.52995598,  0.05620819, -1.27963675,
         1.42135011, -0.37783193,  1.36780179]),
 array([ 0.        ,  0.        ,  0.9077879 , -1.31159361,  0.25      ,
         0.75      ,  0.25      ,  0.9077879 , -1.31159361, -0.90180482,
         0.05354832,  0.1       ,  0.9       ,  0.1       ,  0.1       ,
         0.1       ,  0.9       ,  0.37783193, -1.36780179])]

In [4]:
# Action space for each agent, shown as a list with one entry per agent.
env.action_space

[Discrete(5), Discrete(5)]

In [5]:
# Observation space for each agent, shown as a list with one entry per agent.
env.observation_space

[Box(-inf, inf, (8,), float32), Box(-inf, inf, (19,), float32)]

In [6]:
# Inspect the environment's reward_range attribute.
env.reward_range

(-inf, inf)

In [7]:
# Number of agents in the environment.
env.n

2

In [10]:
# The observation-space list holds one entry per agent, so its length should equal env.n.
len(env.observation_space)

2