From 74e051c45e91c3fa552aaddf8eee4c3953d8ea02 Mon Sep 17 00:00:00 2001 From: ffelten Date: Fri, 3 May 2024 09:51:27 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/momaland@6cd8323a9e80ad3809d1051f3b2ed385f54bad6d=20?= =?UTF-8?q?=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .buildinfo | 2 +- 404.html | 3 +- README/index.html | 3 +- _modules/index.html | 3 +- .../momaland/utils/aec_wrappers/index.html | 3 +- .../momaland/utils/conversions/index.html | 3 +- _modules/momaland/utils/env/index.html | 3 +- .../utils/parallel_wrappers/index.html | 3 +- _static/documentation_options.js | 2 +- api/aec/index.html | 13 ++-- api/parallel/index.html | 7 +- api/wrappers/index.html | 3 +- environments/all-envs/index.html | 64 +++++++++--------- environments/catch/index.html | 3 +- environments/escort/index.html | 3 +- environments/mobeach/index.html | 3 +- environments/mobreakthrough/index.html | 3 +- environments/mocongestion/index.html | 3 +- environments/moconnect4/index.html | 3 +- environments/mogem_mining/index.html | 3 +- environments/moingenious/index.html | 3 +- environments/moitem_gathering/index.html | 9 ++- .../momultiwalker_stability/index.html | 5 +- environments/mopistonball/index.html | 3 +- environments/mosame_game/index.html | 3 +- environments/surround/index.html | 3 +- genindex/index.html | 3 +- index.html | 13 ++-- introduction/install/index.html | 3 +- objects.inv | Bin 1092 -> 1073 bytes release_notes/index.html | 42 +++++++++++- search/index.html | 3 +- searchindex.js | 2 +- tutorials/custom_env/index.html | 3 +- tutorials/learning_algorithms/index.html | 27 +++++++- 35 files changed, 145 insertions(+), 110 deletions(-) diff --git a/.buildinfo b/.buildinfo index dbfc632f..5622ad99 100644 --- a/.buildinfo +++ b/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 7ceb4aaaefed7bfb4d66af48c1aae153 +config: 63a8af9b3368f5f776b1597bc8fb05ae tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/404.html b/404.html index 9248375a..1edf908e 100644 --- a/404.html +++ b/404.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -397,7 +396,7 @@

    The requested page could not be found. + diff --git a/README/index.html b/README/index.html index e5bacc29..f8b075e1 100644 --- a/README/index.html +++ b/README/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -414,7 +413,7 @@

    Build the Documentation + diff --git a/_modules/index.html b/_modules/index.html index 8aabb499..a6f9d11c 100644 --- a/_modules/index.html +++ b/_modules/index.html @@ -231,7 +231,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -367,7 +366,7 @@

    All modules for which code is available

    - + diff --git a/_modules/momaland/utils/aec_wrappers/index.html b/_modules/momaland/utils/aec_wrappers/index.html index 80930a74..2d79d863 100644 --- a/_modules/momaland/utils/aec_wrappers/index.html +++ b/_modules/momaland/utils/aec_wrappers/index.html @@ -231,7 +231,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -506,7 +505,7 @@

    Source code for momaland.utils.aec_wrappers

         
         
     
    -    
    +    
         
         
         
    diff --git a/_modules/momaland/utils/conversions/index.html b/_modules/momaland/utils/conversions/index.html
    index f915333d..4042d354 100644
    --- a/_modules/momaland/utils/conversions/index.html
    +++ b/_modules/momaland/utils/conversions/index.html
    @@ -231,7 +231,6 @@
     
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -538,7 +537,7 @@

    Source code for momaland.utils.conversions

         
         
     
    -    
    +    
         
         
         
    diff --git a/_modules/momaland/utils/env/index.html b/_modules/momaland/utils/env/index.html
    index bd77b6c3..d10bb539 100644
    --- a/_modules/momaland/utils/env/index.html
    +++ b/_modules/momaland/utils/env/index.html
    @@ -231,7 +231,6 @@
     
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -432,7 +431,7 @@

    Source code for momaland.utils.env

         
         
     
    -    
    +    
         
         
         
    diff --git a/_modules/momaland/utils/parallel_wrappers/index.html b/_modules/momaland/utils/parallel_wrappers/index.html
    index d9cbdc46..0c5b2f7c 100644
    --- a/_modules/momaland/utils/parallel_wrappers/index.html
    +++ b/_modules/momaland/utils/parallel_wrappers/index.html
    @@ -231,7 +231,6 @@
     
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -597,7 +596,7 @@

    Source code for momaland.utils.parallel_wrappers

    - + diff --git a/_static/documentation_options.js b/_static/documentation_options.js index c77075b8..aa5dbb33 100644 --- a/_static/documentation_options.js +++ b/_static/documentation_options.js @@ -1,5 +1,5 @@ const DOCUMENTATION_OPTIONS = { - VERSION: '0.0.2', + VERSION: '0.1.0', LANGUAGE: 'en', COLLAPSE_INDEX: false, BUILDER: 'dirhtml', diff --git a/api/aec/index.html b/api/aec/index.html index d6e62f27..cecc1d59 100644 --- a/api/aec/index.html +++ b/api/aec/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -311,8 +310,8 @@

    AEC

    Usage

    -

    Similar to PettingZoo, the MOMAland API models environments as simple Python env classes. Creating environment instances and interacting with them is very simple - here’s an example using the “momultiwalker_v0” environment:

    -
    from momaland.envs.momultiwalker import momultiwalker_v0 as _env
    +

    Similar to PettingZoo, the MOMAland API models environments as simple Python env classes. Creating environment instances and interacting with them is very simple - here’s an example using the “momultiwalker_stability_v0” environment:

    +
    from momaland.envs.momultiwalker_stability import momultiwalker_stability_v0 as _env
     import numpy as np
     
     # .env() function will return an AEC environment, as per PZ standard
    @@ -335,9 +334,9 @@ 

    Usage # Making the vector reward a scalar reward to shift to single-objective multi-agent (aka PettingZoo) # We can assign different weights to the objectives of each agent. weights = { - "walker_0": np.array([0.1, 0.7, 0.2]), - "walker_1": np.array([0.6, 0.1, 0.3]), - "walker_2": np.array([0.2, 0.2, 0.6]), + "walker_0": np.array([0.7, 0.3]), + "walker_1": np.array([0.5, 0.5]), + "walker_2": np.array([0.2, 0.8]), } env = LinearizeReward(env, weights)

    @@ -677,7 +676,7 @@

    Methods¶ - + diff --git a/api/parallel/index.html b/api/parallel/index.html index 97e17205..65c9d63b 100644 --- a/api/parallel/index.html +++ b/api/parallel/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -312,13 +311,13 @@

    Parallel

    Usage

    Parallel environments can be interacted with as follows:

    -
    from momaland.envs.momultiwalker import momultiwalker_v0 as _env
    +
    from momaland.envs.momultiwalker_stability import momultiwalker_stability_v0 as _env
     
     # .parallel_env() function will return a Parallel environment, as per PZ standard
     parallel_env = _env.parallel_env(render_mode="human")
     
     # optionally, you can scalarize the reward with weights
    -parallel_env = momaland.LinearReward(parallel_env, weight=np.array([0.6, 0.2, 0.2]))
    +parallel_env = momaland.LinearReward(parallel_env, weight=np.array([0.7, 0.3]))
     
     observations, infos = parallel_env.reset(seed=42)
     while parallel_env.agents:
    @@ -621,7 +620,7 @@ 

    Methods¶ - + diff --git a/api/wrappers/index.html b/api/wrappers/index.html index 2957d117..39dccc99 100644 --- a/api/wrappers/index.html +++ b/api/wrappers/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -585,7 +584,7 @@

    Parallel - + diff --git a/environments/all-envs/index.html b/environments/all-envs/index.html index 49cb3ae2..ea3e7852 100644 --- a/environments/all-envs/index.html +++ b/environments/all-envs/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -311,7 +310,8 @@

    All Environments

    -

    MOMAland includes environments taken from the MO/MARL literature, as well as multi-objective versions of environments from PettingZoo.

    +

    MOMAland includes environments taken from the MO/MARL literature, as well as multi-objective versions of environments from PettingZoo. +More information are available in the TODO MOMAland paper.

    @@ -342,64 +342,64 @@

    All Environments

    - + - - + + - + - - + + - + - - + + - - + + - + - - + + - + - - + + - - + + - + - - + + - - - + + + - + - - + +

    mo-beach-v0

    Any

    Continuous / Discrete

    [TODO]

    TODO

    [occupation, mixture]

    Taken from Mannion_2018. MO-Beach is a game with two objectives, reflecting the enjoyment of tourists (agents) on their respective beach sections in terms of crowdedness and diversity of attendees. Each beach section is characterised by a capacity and each agent is characterised by a type.

    mo-breakthrough-v0

    Adversarial

    Discrete / Discrete

    [TODO]

    TODO

    [win, fast win, capturing opponent's pieces, avoiding capture]

    Multi-objective version of the two-player, turn-based, board game Breakthrough.

    mo-congestion-v0

    Mixed

    Continuous / Discrete

    [TODO]

    TODO

    [travel time, cost]

    MO-RouteChoice is a multi-objective extension of the route choice problem Thomasini_2023, where a number of self-interested drivers (agents) must navigate a road network.

    mo-connect4-v0

    Adversarial

    Discrete / Discrete

    [TODO]

    TODO

    [win, fast win, [column #n]]

    MO version of Connect 4. Additional objectives are fast win and optionally one objective per column.

    mo-gem-mining-v0

    Cooperative

    Continuous / Discrete

    [TODO]

    TODO

    [#gems] (configurable)

    MO version of Gem Mining Bargiacchi_2018. Agents go to different mines to extract different gems (objectives). There are restrictions on which mines can be reached for each agent. Agents also influence each other’s producitivity.

    mo-ingenious-v0

    Any

    Discrete / Discrete

    [TODO]

    TODO

    [#colors] (configurable)

    MO adaptation of the zero-sum, turn-based board game Ingenious. The game’s original rules support 2-4 players collecting scores in multiple colors (objectives), with the goal of winning by maximizing the minimum score over all colors.

    mo-item-gathering-v0

    Adversarial

    Discrete / Discrete

    [TODO]

    TODO

    [#objects] (configurable)

    Adapted from Kallstrom_2019, is a multi-agent grid world, containing items of different colours. Each colour represents a different objective and the goal of the agents is to collect as many objects as possible.

    mo-multiwalker-v0

    mo-multiwalker-stability-v0

    Cooperative

    Continuous / Continuous

    [TODO]

    TODO

    [progress right, package stability]

    A MO version of PZ’s MultiWalker introduced in Gupta_2017, where the agents also seek to keep the package steady.

    mo-pistonball-v0

    Cooperative

    TODO / TODO

    [TODO]

    TODO

    Continuous / Any

    [agent_#n_reward] (configurable)

    An MO version of PZ’s Pistonball where the reward of each agent is kept separate.

    mo-same-game-v0

    Any

    Discrete / Discrete

    [TODO]

    TODO

    [colors_n] (configurable)

    MO-SameGame is a multi-objective, multi-agent variant of the single-player, single-objective turn-based puzzle game called SameGame Baier_2015. The original single-player, single-objective SameGame rewards the player with \(n^2\) points for removing any group of n tiles. MO-SameGame can extend this in two ways. Agents can either only get points for their own actions, leading to competition between them, or all rewards can be shared in ``team reward’’ mode. Additionally, points for every colour can be counted as separate objectives, allowing for different trade-offs between colours, or they can be accumulated in a single objective like in the default game variant, essentially providing a single-objective wrapper for the game.

    @@ -480,10 +480,12 @@

    All Environments + + + + diff --git a/environments/escort/index.html b/environments/escort/index.html index 0db5a7c1..51381b51 100644 --- a/environments/escort/index.html +++ b/environments/escort/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -492,7 +491,7 @@

    Credits¶ - + diff --git a/environments/mobeach/index.html b/environments/mobeach/index.html index 25e149fa..10c1479e 100644 --- a/environments/mobeach/index.html +++ b/environments/mobeach/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -483,7 +482,7 @@

    Arguments + diff --git a/environments/mobreakthrough/index.html b/environments/mobreakthrough/index.html index 3143cf1e..786ed26f 100644 --- a/environments/mobreakthrough/index.html +++ b/environments/mobreakthrough/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -485,7 +484,7 @@

    Version History + diff --git a/environments/mocongestion/index.html b/environments/mocongestion/index.html index 5b5d50e8..32c29874 100644 --- a/environments/mocongestion/index.html +++ b/environments/mocongestion/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -476,7 +475,7 @@

    Credits¶ - + diff --git a/environments/moconnect4/index.html b/environments/moconnect4/index.html index 4b66dc34..d9bf1282 100644 --- a/environments/moconnect4/index.html +++ b/environments/moconnect4/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -489,7 +488,7 @@

    Version History + diff --git a/environments/mogem_mining/index.html b/environments/mogem_mining/index.html index db5d439d..aabb4c3e 100644 --- a/environments/mogem_mining/index.html +++ b/environments/mogem_mining/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -483,7 +482,7 @@

    Credits¶ - + diff --git a/environments/moingenious/index.html b/environments/moingenious/index.html index 3556413d..7917a232 100644 --- a/environments/moingenious/index.html +++ b/environments/moingenious/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -403,7 +402,7 @@

    MO-Ingenious + diff --git a/environments/moitem_gathering/index.html b/environments/moitem_gathering/index.html index 4e9e3865..6a8f0fdb 100644 --- a/environments/moitem_gathering/index.html +++ b/environments/moitem_gathering/index.html @@ -8,7 +8,7 @@ - + @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -379,12 +378,12 @@

    Arguments - +
    Next
    -
    MO-Multiwalker
    +
    MO-MultiwalkerStability
    @@ -473,7 +472,7 @@

    Arguments + diff --git a/environments/momultiwalker_stability/index.html b/environments/momultiwalker_stability/index.html index 4e8e70a6..bbebfb85 100644 --- a/environments/momultiwalker_stability/index.html +++ b/environments/momultiwalker_stability/index.html @@ -8,7 +8,7 @@ - + @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -463,7 +462,7 @@

    Arguments + diff --git a/environments/mopistonball/index.html b/environments/mopistonball/index.html index eb419b3b..327597ea 100644 --- a/environments/mopistonball/index.html +++ b/environments/mopistonball/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -480,7 +479,7 @@

    Credits¶ - + diff --git a/environments/mosame_game/index.html b/environments/mosame_game/index.html index 0361de73..c69cbdcb 100644 --- a/environments/mosame_game/index.html +++ b/environments/mosame_game/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -489,7 +488,7 @@

    Version History + diff --git a/environments/surround/index.html b/environments/surround/index.html index 73646d23..cefafb73 100644 --- a/environments/surround/index.html +++ b/environments/surround/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -490,7 +489,7 @@

    Credits¶ - + diff --git a/genindex/index.html b/genindex/index.html index cde2df65..cb234ff9 100644 --- a/genindex/index.html +++ b/genindex/index.html @@ -230,7 +230,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -588,7 +587,7 @@

    T

    - + diff --git a/index.html b/index.html index 3031a2c3..ac2c943d 100644 --- a/index.html +++ b/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -333,8 +332,8 @@

    The documentation website is at https://momaland.farama.org/, and we have a public discord server (which we also use to coordinate development work) that you can join here.

    API

    -

    Similar to PettingZoo, the MOMAland API models environments as simple Python env classes. Creating environment instances and interacting with them is very simple - here’s an example using the “momultiwalker_v0” environment:

    -
    from momaland.envs.momultiwalker import momultiwalker_v0 as _env
    +

    Similar to PettingZoo, the MOMAland API models environments as simple Python env classes. Creating environment instances and interacting with them is very simple - here’s an example using the “momultiwalker_stability_v0” environment:

    +
    from momaland.envs.momultiwalker_stability import momultiwalker_stability_v0 as _env
     import numpy as np
     
     # .env() function will return an AEC environment, as per PZ standard
    @@ -357,9 +356,9 @@ 

    API

    # Making the vector reward a scalar reward to shift to single-objective multi-agent (aka PettingZoo) # We can assign different weights to the objectives of each agent. weights = { - "walker_0": np.array([0.1, 0.7, 0.2]), - "walker_1": np.array([0.6, 0.1, 0.3]), - "walker_2": np.array([0.2, 0.2, 0.6]), + "walker_0": np.array([0.7, 0.3]), + "walker_1": np.array([0.5, 0.5]), + "walker_2": np.array([0.2, 0.8]), } env = LinearizeReward(env, weights)
    @@ -452,7 +451,7 @@

    Citing + diff --git a/introduction/install/index.html b/introduction/install/index.html index 69db84be..b699b74b 100644 --- a/introduction/install/index.html +++ b/introduction/install/index.html @@ -232,7 +232,6 @@
  • MO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -396,7 +395,7 @@

    Install¶ - + diff --git a/objects.inv b/objects.inv index fc5248e93291a97683c59bbd1dceb731ace5e4dc..0ebd9f48c973a76174ff44881f6ffef3a5dc7ca9 100644 GIT binary patch delta 967 zcmV;&133J|2(bu|cz;W8qc9MF@B9i&-D|>D>Z!MGH(OO|+NjlPkH~@9#Ht_2Hht`` z-?4!Nh@k~~Xan>3W<0jXMkql!mD#eejGHBeG2Iqp|%F}3!S?xPB3#bnwUqfjA2_2bIYPZX65D_pMwSi zcB-rETyrL(Nq?9#d`Fq?Z!F}~^0%M`lYSvh4{voL)2WP2)u;nKw(jAd^B(TDGg!ev zjpg<3kCC8o4;=~lxF3!LekttZ9yu5I683-OCQM3A8 zqrRt20kjS6f!sYYZ6)M70D&2bzPPZ5eeQ<3st)$D<#9kktvFsen(b8bx z1qxc>f`0}$AkN9Ep^8pJ^is+M$hG@v`+>n3wY`p|IwmXs+jbRd3v?i8rFXNp_~D*T z+%?c=yVt7N4N@9rC9EOnGVyzD2gZMn^b?Opo_BqC4bUWh+*}N^yh%;+FI~tN$ixAofz%70?a9kqMV!@0E$ODKwNYDpI?3U1je z<39F078b9n923>AQ56)*rh*m%|x zKHT76n`8>DU0>_P)CMtms-B|8b_}=tdB>}TY}ZKx2WlXZ%0jCvv=lLU zEMMJ`3nnsn&FCImr3@EjsdEQ()LO^k!9W~Vai2*e1Gcz<7Sn=lZ--}w}ly4QqN>eJr3E~_dvThwaWBXZ!DSoI%dn|9r& z-`PMg1ZaUiw87`Q-<^;1*$5>lr!rd?mT|MDkR~sh<~eAyzGo7sX8+&;UZ~DU{`w{5 z)EII}XwKqVFTVIhR*@J1{ZJYw=YdispK*>UY1Tp|j%!ttQ-4i42VVPFf;_QoiJyZ6 z`Mlo#yx!bwpr7f|vN*#mjc8^ZxiW_BIV??!2AP$cb9xLK z4A{A*u5&GU5q}|J$?_d#zP+)K&x_xJ7EJm=n(yA~LZ)*WyQ)$5^w_$Gzt4KS+b&@B zE@~=oaDPk$_4m+;khlBcMBsfhI5~!81K+t94_u2uB{~Q@6HcFm%a~k&0B!1jnjkCN;P4a^-=KvzX z3lWot5mKY%S+^jze$<7b2qaU58DX7tJnF6oxFywR zz~l)Sft_?b>k%Jr@vluXh1RZ74q|GBm^@ZbQLw-JdsDT;tLEhD1g{H!+Xl5XCU@>9 zYJXI!D9H8h4y9JBtngRdm`TifJAHlgj_4nv&SvWmHrQ^}ftB@yo4>B=3Ct$C+`rKQKFmJ_HL(y*_IPOZpvr>4J1-oXmzO8L`)vap*#M;L{kQ@Jl!L-lwmEGbMCSbwYEV2VosZ&Drs9- zr5WXT3KqCXk)U=MSKmCA4SjO2n35YW3{T#Gh)d9}MJJRWP-Kt7^rL$eV{%^!Nh6H@ I0~!^oWl%TeMO-GemMining
  • MO-Ingenious
  • MO-ItemGathering
  • -
  • MO-Multiwalker
  • MO-MultiwalkerStability
  • MO-Pistonball
  • MO-SameGame
  • @@ -309,6 +308,44 @@

    Release Notes

    +
    +

    0.1.0

    +

    Released on 2024-05-03 - GitHub - PyPI

    +

    What's Changed

    + +

    New Contributors

    + +

    Full Changelog: v0.0.2...0.1.0

    v0.0.2: Dummy release 2

    Released on 2023-12-20 - GitHub - PyPI

    @@ -367,6 +404,7 @@

    v0.0.1: Dummy release
    • Release Notes @@ -403,7 +441,7 @@

      v0.0.1: Dummy release + diff --git a/search/index.html b/search/index.html index daa74c0d..bad64ca1 100644 --- a/search/index.html +++ b/search/index.html @@ -229,7 +229,6 @@
    • MO-GemMining
    • MO-Ingenious
    • MO-ItemGathering
    • -
    • MO-Multiwalker
    • MO-MultiwalkerStability
    • MO-Pistonball
    • MO-SameGame
    • @@ -371,7 +370,7 @@ - + diff --git a/searchindex.js b/searchindex.js index 7a25782c..a249743b 100644 --- a/searchindex.js +++ b/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "AEC": [[2, "aec"], [4, "aec"]], "AEC to Parallel": [[4, "aec-to-parallel"]], "API": [[20, "api"]], "Action Space": [[6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [12, "action-space"], [14, "action-space"], [15, "action-space"], [16, "action-space"], [17, "action-space"], [18, "action-space"], [19, "action-space"]], "All Environments": [[5, "all-environments"]], "Arguments": [[6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [11, "arguments"], [12, "arguments"], [14, "arguments"], [15, "arguments"], [16, "arguments"], [17, "arguments"], [18, "arguments"], [19, "arguments"]], "Attributes": [[2, "attributes"], [3, "attributes"]], "Build the Documentation": [[1, "build-the-documentation"]], "Catch": [[6, "catch"]], "Citing": [[20, "citing"]], "Conversion": [[4, "conversion"]], "Credits": [[6, "credits"], [7, "credits"], [10, "credits"], [12, "credits"], [17, "credits"], [19, "credits"]], "Episode Termination": [[6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [12, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [16, "episode-termination"], [17, "episode-termination"], [19, "episode-termination"]], "Episode Truncation": [[6, "episode-truncation"], [7, "episode-truncation"], [8, "episode-truncation"], [10, "episode-truncation"], [12, "episode-truncation"], [14, "episode-truncation"], [17, "episode-truncation"], [19, "episode-truncation"]], "Escort": [[7, "escort"]], "Install": [[20, "install"], [21, "install"]], "Learning algorithms": [[24, "learning-algorithms"]], "Legal Actions Mask": [[9, "legal-actions-mask"], [11, "legal-actions-mask"], [18, "legal-actions-mask"]], "MO-Beach": [[8, "mo-beach"]], "MO-Breakthrough": [[9, "mo-breakthrough"]], "MO-Congestion": [[10, "mo-congestion"]], "MO-Connect4": [[11, "mo-connect4"]], "MO-GemMining": [[12, "mo-gemmining"]], "MO-Ingenious": [[13, "mo-ingenious"]], "MO-ItemGathering": [[14, "mo-itemgathering"]], "MO-Multiwalker": [[15, "mo-multiwalker"]], "MO-MultiwalkerStability": [[16, "mo-multiwalkerstability"]], "MO-Pistonball": [[17, "mo-pistonball"]], "MO-SameGame": [[18, "mo-samegame"]], "MOAECEnv": [[2, "moaecenv"]], "MOMAland documentation": [[1, "momaland-documentation"]], "MOParallelEnv": [[3, "moparallelenv"]], "Making a Custom Environment": [[23, "making-a-custom-environment"]], "Methods": [[2, "methods"], [3, "methods"]], "Observation Space": [[6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [12, "observation-space"], [14, "observation-space"], [15, "observation-space"], [16, "observation-space"], [17, "observation-space"], [18, "observation-space"], [19, "observation-space"]], "Parallel": [[3, "parallel"], [4, "parallel"]], "Parallel to AEC": [[4, "parallel-to-aec"]], "Release Notes": [[22, "release-notes"]], "Reward Space": [[6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [10, "reward-space"], [12, "reward-space"], [14, "reward-space"], [15, "reward-space"], [16, "reward-space"], [17, "reward-space"], [19, "reward-space"]], "Rewards": [[9, "rewards"], [11, "rewards"], [18, "rewards"]], "Setup pre-commit hooks": [[23, "setup-pre-commit-hooks"]], "Starting State": [[6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [12, "starting-state"], [14, "starting-state"], [17, "starting-state"], [18, "starting-state"], [19, "starting-state"]], "Surround": [[19, "surround"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Usage": [[2, "usage"], [3, "usage"]], "Version History": [[9, "version-history"], [11, "version-history"], [18, "version-history"]], "Wrappers and Utils": [[4, "wrappers-and-utils"]], "v0.0.1: Dummy release": [[22, "release-v0-0-1"]], "v0.0.2: Dummy release 2": [[22, "release-v0-0-2"]]}, "docnames": ["404", "README", "api/aec", "api/parallel", "api/wrappers", "environments/all-envs", "environments/catch", "environments/escort", "environments/mobeach", "environments/mobreakthrough", "environments/mocongestion", "environments/moconnect4", "environments/mogem_mining", "environments/moingenious", "environments/moitem_gathering", "environments/momultiwalker", "environments/momultiwalker_stability", "environments/mopistonball", "environments/mosame_game", "environments/surround", "index", "introduction/install", "release_notes", "tutorials/custom_env", "tutorials/learning_algorithms"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/aec.md", "api/parallel.md", "api/wrappers.md", "environments/all-envs.md", "environments/catch.md", "environments/escort.md", "environments/mobeach.md", "environments/mobreakthrough.md", "environments/mocongestion.md", "environments/moconnect4.md", "environments/mogem_mining.md", "environments/moingenious.md", "environments/moitem_gathering.md", "environments/momultiwalker.md", "environments/momultiwalker_stability.md", "environments/mopistonball.md", "environments/mosame_game.md", "environments/surround.md", "index.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "tutorials/learning_algorithms.md"], "indexentries": {"action_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.action_space", false]], "action_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.action_space", false]], "action_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.action_spaces", false]], "action_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.action_spaces", false]], "agent_selection (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agent_selection", false]], "agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agents", false]], "agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.agents", false]], "close() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.close", false]], "close() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.close", false]], "infos (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.infos", false]], "linearizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.LinearizeReward", false]], "linearizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.LinearizeReward", false]], "max_num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.max_num_agents", false]], "max_num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.max_num_agents", false]], "mo_aec_to_parallel_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_aec_to_parallel_wrapper", false]], "mo_parallel_to_aec_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_parallel_to_aec_wrapper", false]], "moaecenv (class in momaland.utils.env)": [[2, "momaland.utils.env.MOAECEnv", false]], "moparallelenv (class in momaland.utils.env)": [[3, "momaland.utils.env.MOParallelEnv", false]], "normalizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.NormalizeReward", false]], "normalizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.NormalizeReward", false]], "num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.num_agents", false]], "num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.num_agents", false]], "observation_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observation_space", false]], "observation_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.observation_space", false]], "observation_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.observation_spaces", false]], "observation_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.observation_spaces", false]], "observe() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observe", false]], "possible_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.possible_agents", false]], "possible_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.possible_agents", false]], "recordepisodestatistics (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.RecordEpisodeStatistics", false]], "render() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.render", false]], "render() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.render", false]], "reset() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reset", false]], "reset() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reset", false]], "reward_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reward_space", false]], "reward_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reward_space", false]], "reward_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.reward_spaces", false]], "reward_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.reward_spaces", false]], "rewards (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.rewards", false]], "state() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.state", false]], "step() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.step", false]], "step() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.step", false]], "terminations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.terminations", false]], "truncations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.truncations", false]]}, "objects": {"momaland.utils.aec_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"]], "momaland.utils.conversions": [[4, 0, 1, "", "mo_aec_to_parallel_wrapper"], [4, 0, 1, "", "mo_parallel_to_aec_wrapper"]], "momaland.utils.env": [[2, 0, 1, "", "MOAECEnv"], [3, 0, 1, "", "MOParallelEnv"]], "momaland.utils.env.MOAECEnv": [[2, 1, 1, "", "action_space"], [2, 2, 1, "", "action_spaces"], [2, 2, 1, "", "agent_selection"], [2, 2, 1, "", "agents"], [2, 1, 1, "", "close"], [2, 2, 1, "", "infos"], [2, 2, 1, "", "max_num_agents"], [2, 2, 1, "", "num_agents"], [2, 1, 1, "", "observation_space"], [2, 2, 1, "", "observation_spaces"], [2, 1, 1, "", "observe"], [2, 2, 1, "", "possible_agents"], [2, 1, 1, "", "render"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "reward_space"], [2, 2, 1, "", "reward_spaces"], [2, 2, 1, "", "rewards"], [2, 1, 1, "", "step"], [2, 2, 1, "", "terminations"], [2, 2, 1, "", "truncations"]], "momaland.utils.env.MOParallelEnv": [[3, 1, 1, "", "action_space"], [3, 2, 1, "", "action_spaces"], [3, 2, 1, "", "agents"], [3, 1, 1, "", "close"], [3, 2, 1, "", "max_num_agents"], [3, 2, 1, "", "num_agents"], [3, 1, 1, "", "observation_space"], [3, 2, 1, "", "observation_spaces"], [3, 2, 1, "", "possible_agents"], [3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "reward_space"], [3, 2, 1, "", "reward_spaces"], [3, 1, 1, "", "state"], [3, 1, 1, "", "step"]], "momaland.utils.parallel_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"], [4, 0, 1, "", "RecordEpisodeStatistics"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute"}, "terms": {"": [2, 3, 4, 6, 7, 8, 9, 11, 17, 18, 19, 20, 24], "0": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "00e": 17, "01": 17, "01567": 16, "02": 16, "04": 17, "08": 4, "1": [2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "10": [6, 7, 12, 14, 18, 19], "100": [8, 15, 16, 17], "100e": 16, "11": [12, 13], "110": [15, 16], "12": [8, 12, 22], "120": 17, "125": 17, "13": 12, "14": 12, "15": [6, 7, 12, 18, 19], "16": 12, "17": 12, "18": [12, 13], "19": [12, 17], "192": 9, "1e": 4, "2": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "20": [9, 11, 12, 17, 22], "200": [6, 7, 19], "2019": 14, "2023": 22, "209": 16, "225": 18, "23": 12, "255": 17, "2880": 13, "2d": [6, 7, 8, 10, 14, 16, 19], "3": [2, 6, 7, 8, 9, 10, 12, 14, 15, 17, 18, 19, 20], "30": 18, "31": [15, 16], "3d": [6, 7, 15, 17, 19], "4": [9, 11, 12, 14, 15, 16], "4199": 10, "42": [2, 3, 12, 20], "457": 17, "46": [15, 16], "46666667": 15, "5": [6, 7, 8, 9, 12, 14, 17, 18, 19], "50625": 18, "54": 16, "567e": 16, "6": [2, 3, 8, 11, 12, 13, 17, 20], "60": 17, "7": [2, 8, 11, 12, 20], "75": 17, "79e": 17, "8": [4, 9, 11, 12, 14, 17], "881808": 8, "8x8": [9, 14], "9": [4, 11, 12], "99": [4, 8], "A": [2, 3, 4, 6, 7, 8, 10, 14, 16, 19, 20], "And": 3, "As": [12, 17], "At": [9, 11], "For": [1, 2, 3, 4, 20], "If": [8, 9, 11, 15, 16, 18, 20], "In": [3, 9, 10, 11], "It": 8, "On": 4, "The": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 24], "There": 9, "These": [2, 3], "To": [1, 20, 21, 24], "With": 11, "_build": 1, "_env": [2, 3, 20], "_of_a_of_current_typ": 8, "_scalartype_co": 2, "a_typ": 8, "about": 1, "abov": [17, 18], "accept": 2, "access": [2, 4], "accord": 8, "accumul": [2, 18], "action": [2, 3, 5, 13, 20, 24], "action_mask": [9, 11, 13, 18], "action_spac": [2, 3, 20], "actiontyp": [2, 3], "ad": [2, 3, 12], "adapt": [6, 7, 10, 15, 16, 17, 19], "add": [4, 23], "addit": [9, 11], "addition": [9, 11, 18, 23], "adversari": 5, "aec": [17, 20, 21, 23], "aec_env": 4, "aec_wrapp": 4, "aecwrapp": 4, "after": [2, 8, 10, 12], "agent": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23], "agent_0": 4, "agent_1": 4, "agent_i": [6, 7, 8, 10, 12, 13, 14, 18, 19], "agent_it": [2, 20], "agent_select": 2, "agentid": [2, 3], "aka": [2, 20], "algorithm": [20, 21], "aliv": [15, 16], "all": [2, 3, 8, 9, 11, 12, 14, 18, 20, 21], "all_modul": 23, "also": [2, 4, 8, 9, 20], "altern": 3, "alternatingli": 9, "alwai": 10, "amount": [6, 7, 17, 19], "an": [2, 3, 4, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18, 19, 20, 23], "analysi": [2, 20], "angl": 16, "ani": [2, 9, 11, 12, 18, 24], "anoth": [12, 18], "ansi": [2, 3], "api": [2, 3, 4, 21], "appli": 4, "appropri": 3, "ar": [2, 3, 4, 6, 7, 8, 9, 10, 11, 16, 17, 18, 19, 23, 24], "area": [6, 7, 19], "around": 5, "arrai": [2, 3, 4, 6, 7, 19, 20], "assign": [2, 20], "autobuild": 1, "automat": [1, 2], "avail": [9, 11, 14, 15, 16, 18], "averag": [4, 6, 7, 19], "avoid": [4, 6, 7, 9, 10, 16, 19], "award": [9, 11], "b": 1, "ball": 17, "ball_elast": 17, "ball_frict": 17, "ball_mass": 17, "bandit": 12, "bargiacchi": 12, "base": [2, 3, 4, 9, 10, 11, 12, 16, 18, 20], "baselin": 24, "basic": [20, 21], "beach": 5, "becom": 18, "been": [11, 14], "befor": 17, "behavior": 4, "below": [9, 11, 18], "bernoulli": 12, "between": [4, 5, 17, 18, 20], "binari": [9, 11, 18], "board": [9, 11, 13, 18], "board_height": [9, 11, 18], "board_siz": 11, "board_width": [9, 11, 18], "bonu": 12, "bool": [2, 3], "both": [9, 11, 16], "bottom": 11, "bound": [15, 16], "box": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "braess": 10, "break": 5, "breakthrough": 5, "bump": 22, "call": [2, 18], "can": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 17, 18, 19, 20, 21], "cannot": [2, 3, 11], "capac": 8, "captur": 9, "case": [9, 10, 11], "catch": 5, "catch_v0": 6, "cbox": 12, "cd": 1, "cell": [9, 11, 14], "central": 3, "certain": [20, 21], "chang": [1, 2, 3, 4, 8, 16, 17], "check": [2, 4, 20, 22, 23], "choos": 10, "circl": 5, "class": [2, 3, 4, 20, 23], "classic": [2, 3], "cleanrl": 24, "close": [2, 3, 17, 18, 20, 24], "closer": 17, "code": [4, 6, 7, 10, 12, 17, 19], "codebas": 10, "colab": [2, 20], "collid": [6, 7, 19], "collis": [6, 7, 19], "color": 18, "color_reward": 18, "column": [11, 18], "column_object": 11, "commun": 20, "compar": 20, "compat": 24, "compliant": 20, "compon": [17, 20, 21], "condit": [6, 7, 19], "conflict": 11, "congest": 5, "connect": [2, 11, 12, 18], "connect4": 5, "constant": 10, "constructor": 23, "consumpt": 8, "contain": [1, 2, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 24], "continu": [5, 6, 7, 8, 15, 16, 17, 19, 24], "contribut": 1, "control": 2, "convers": 23, "convert": 4, "cooper": [5, 12, 17], "coordin": [6, 7, 9, 18, 19, 20], "corner": 5, "correctli": 4, "correl": 12, "correlated_object": 12, "correspond": [2, 8, 9, 10, 11, 12], "cost": 10, "could": [2, 3], "count": 18, "creat": [2, 20, 23], "current": [2, 3, 8, 9, 11, 18, 24], "customiz": 12, "cycl": 17, "d": 18, "data": 3, "decentr": 3, "decis": [2, 20], "default": [2, 3, 8, 11, 12, 14, 15, 16, 17, 18], "defaultli": 12, "defin": 23, "definit": [2, 20], "depend": [4, 10, 20, 21], "describ": [9, 11, 18], "descript": 5, "destin": [5, 10], "detail": [2, 3, 20], "determin": 14, "develop": 20, "diagon": [9, 11], "dict": [2, 3, 4, 9, 11, 13, 18], "dictionari": [3, 9, 11, 18, 23], "diederik": 12, "differ": [2, 8, 10, 12, 18, 20], "dimens": [9, 11, 18], "direct": [6, 7, 19], "directli": 2, "directori": [23, 24], "dirhtml": 1, "disappear": 18, "discord": 20, "discount": 4, "discret": [5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 24], "disentangl": 17, "displai": [2, 3, 6, 7, 10, 19], "distanc": [5, 6, 7, 15, 16, 19], "distance_other_dron": 5, "distance_target": 5, "distribut": 8, "divid": 9, "do": [9, 11], "doc": 1, "document": [2, 3, 15, 16, 20, 21, 23], "doe": [2, 20, 21], "domain": [8, 12], "don": 23, "down": [14, 17, 18], "draw": [9, 11], "driver": 10, "drone": [5, 6, 7, 19], "drop": [11, 15, 16, 17], "dtype": 2, "due": 12, "duplic": 4, "dure": [15, 16], "e": [1, 2, 3, 12, 23], "each": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 14, 17, 18, 19, 20, 23, 24], "edg": 17, "either": [9, 10, 11, 18], "elast": 17, "element": [9, 11, 15, 16, 18], "els": [2, 20], "empti": [9, 11, 14, 18], "encod": [9, 11, 18], "end": [4, 11, 15, 16], "enforc": [2, 3], "entir": 18, "entri": 14, "env": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23], "env_nam": 23, "environ": [2, 3, 4, 6, 7, 8, 10, 12, 13, 14, 15, 16, 17, 19, 20, 24], "episod": 4, "epsilon": 4, "equal": [8, 11, 12], "equival": [2, 3], "escap": 6, "escort": 5, "escort_v0": 7, "essenti": 20, "etc": 3, "eugenio": 12, "evalu": 24, "even": [15, 16], "everi": [1, 2, 3, 11, 18], "everyth": [20, 21, 23, 24], "exampl": [2, 4, 6, 7, 8, 19, 20, 23], "except": [9, 11, 18], "exclud": 12, "exclus": [9, 11, 18], "execut": [2, 3], "exert": [15, 16], "exist": 11, "expect": 12, "exponenti": 4, "export": 23, "extend": [2, 3, 9, 11, 18, 23], "factor": [4, 11], "factori": 23, "fall": [11, 15, 16, 18], "fals": [14, 18], "farama": 20, "faster": [9, 11], "felten": [6, 7, 19], "few": 4, "file": 24, "fill": [9, 11, 18], "final": [7, 19], "final_target_loc": [7, 19], "find": 12, "finish": 17, "first": [2, 9, 16], "fix": [4, 5], "float": [2, 3, 4, 6, 7, 10, 19], "float32": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "folder": 1, "follow": [3, 6, 7, 16, 19, 20], "forc": [15, 16], "fork": 1, "format": 5, "forward": 9, "found": [9, 11, 12, 18], "four": 11, "fourth": 9, "frame": 3, "friction": 17, "from": [2, 3, 5, 6, 7, 9, 10, 11, 12, 16, 17, 18, 19, 20, 23, 24], "front": 9, "full": 11, "fulli": 12, "function": [2, 3, 12, 20, 23], "g": 23, "game": [5, 9, 11, 13, 18], "gamma": 4, "gap": 18, "gather": [5, 14], "gem": [5, 12], "gener": [2, 3, 12], "get": [9, 11, 18], "github": 22, "give": [15, 16], "given": [8, 9, 11, 12, 17, 18, 23], "global": [3, 8, 17], "go": 1, "greater": 12, "grid": [9, 11, 14, 18], "ground": [6, 7, 19], "group": 18, "guid": 21, "gym": 3, "gymnasium": [2, 3], "ha": [2, 3, 4, 8, 9, 11, 12, 18], "handl": 4, "have": [4, 9, 10, 11, 14, 20, 23], "height": [9, 11, 18], "heintz": 14, "henc": 12, "here": [2, 20, 24], "heterogen": 10, "higher": [15, 16], "hip": [15, 16], "hold": [9, 11, 18], "home": 9, "horizont": [11, 18], "how": [1, 6, 7, 17, 19], "http": 20, "human": [2, 3, 6, 7, 10, 11, 17, 19, 20], "i": [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24], "id": [8, 12, 14], "ident": 9, "idx": 4, "imag": 17, "immedi": 4, "implement": [2, 3, 24], "import": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "incentiv": [9, 11], "includ": [5, 20, 21], "index": [4, 9, 11, 18], "indic": [9, 11, 18, 24], "individu": 18, "inf": [6, 7, 15, 16, 19], "info": [2, 3, 20], "inform": 1, "ingeni": 5, "inherit": 4, "init_flying_po": [6, 7, 19], "init_target_loc": [6, 7, 19], "initi": [4, 6, 7, 8, 14, 18, 19, 23], "initial_map": 14, "inproceed": 20, "input": 4, "insert": [2, 3, 20], "insid": 23, "instal": [1, 23], "instanc": [2, 4, 12, 20], "instantan": 2, "instanti": 4, "instead": [20, 23], "int": [2, 3, 6, 7, 8, 10, 17, 19], "int32": 13, "int64": 14, "int8": [9, 11, 13, 18], "integ": [2, 3, 9, 11, 12, 14, 18], "interact": [2, 3, 20], "intermedi": [7, 19], "intern": 2, "isn": 12, "item": [5, 14], "its": 5, "join": 20, "joint": [15, 16], "just": 12, "keep": [4, 24], "kei": [2, 3, 4], "knee": [15, 16], "k\u00e4llstr\u00f6m": 14, "land": 11, "languag": 12, "last": [2, 8, 9, 12, 20], "latenc": 10, "learn": [6, 7, 10, 19, 20, 21], "least": 18, "left": [8, 9, 14, 18], "length": [2, 3, 6, 7, 8, 12, 19], "less": 12, "level": [8, 15, 16], "librari": [20, 24], "like": [2, 3, 4, 18, 24], "limit": [12, 17], "linear": [4, 24], "linearizereward": [2, 4, 20], "linearreward": 3, "list": [2, 3, 24], "literatur": 5, "live": 12, "local": [8, 12, 17], "locat": [9, 11, 18], "look": 2, "lose": [9, 11], "lost": 9, "lower": [15, 16, 17], "made": [1, 11], "mai": [2, 3], "main": [9, 11, 18], "maintain": 5, "make": [1, 2, 20], "map": 14, "margin": 10, "marl": 5, "mass": 17, "max": 9, "max_connect": 12, "max_cycl": 17, "max_mov": 9, "max_num_ag": [2, 3], "max_prob": 12, "max_work": 12, "maxim": [6, 7, 15, 16, 19], "maximis": 17, "maximum": [8, 12, 14, 17], "mct": 10, "md": 1, "mean": [9, 11, 18], "member": [2, 3, 23], "met": [6, 7, 19], "method": 23, "min_connect": 12, "min_prob": 12, "min_work": 12, "mine": [5, 12], "minim": [6, 7, 10, 17, 19], "minimis": 10, "minimum": 12, "mixtur": 8, "mo": [4, 5], "mo_aec_to_parallel_wrapp": 4, "mo_parallel_to_aec": 23, "mo_parallel_to_aec_wrapp": 4, "moaec": 2, "moaecenv": 23, "mobeach_v0": [8, 23], "mobil": 5, "mobreakthrough_v0": 9, "mocongestion_v0": 10, "moconnect4_v0": 11, "mode": [2, 3, 6, 7, 8, 9, 10, 11, 12, 14, 17, 18, 19], "model": [2, 20], "modifi": 9, "modul": 4, "mogem_mining_v0": 12, "moingenious_v0": 13, "moitem_gathering_v0": 14, "momaland": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24], "momappo": 24, "momarl": 20, "momultiwalk": [2, 3, 20], "momultiwalker_stability_v0": 16, "momultiwalker_v0": [2, 3, 15, 20], "monetari": 10, "moparallel": 3, "moparallelenv": 23, "mopistonball_v0": 17, "more": [1, 2, 3, 11, 20], "morl": 24, "mosame_game_v0": 18, "most": 12, "move": [4, 6, 7, 8, 9, 11, 17, 18, 19], "move_count": [9, 11], "multi": [2, 3, 5, 9, 10, 11, 14, 18, 20, 24], "multibinari": 9, "multipli": 12, "multiwalk": [5, 16], "must": [2, 3, 4, 5], "n": [2, 18], "n_piston": 17, "name": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 24], "nativ": 4, "ndarrai": [2, 3], "need": [10, 17], "neg": [9, 12, 14], "negat": [9, 11], "network": [2, 10], "nevertheless": 24, "new": [4, 23], "newli": 4, "next": [2, 17], "non": 12, "none": [2, 3, 6, 7, 8, 10, 14, 17, 19, 20], "normal": 4, "normalizereward": 4, "note": [2, 12], "notebook": [2, 20], "np": [2, 3, 4, 20], "nparrai": [6, 7, 19], "nth": 2, "num_ag": [2, 3, 8, 10, 12, 18], "num_color": 18, "num_dron": [6, 7, 19], "num_intermediate_point": [7, 19], "num_object": [9, 12, 18], "num_timestep": [8, 10, 12, 14], "number": [7, 8, 9, 10, 11, 12, 14, 17, 18, 19], "numpi": [2, 3, 20], "ob": 5, "object": [2, 3, 4, 5, 8, 9, 10, 11, 12, 14, 16, 18, 20, 24], "observ": [2, 3, 13, 20, 24], "observation_spac": [2, 3], "obstyp": [2, 3], "occup": 8, "occupi": 8, "occur": 14, "od": 10, "ol": 24, "onc": 1, "one": [6, 7, 9, 11, 15, 16, 18, 19], "onli": [8, 9, 18], "open": 20, "oppon": [9, 11], "oppos": [2, 3], "option": [2, 3, 6, 7, 9, 10, 11, 17, 19, 20], "order": [6, 7, 18, 19], "org": 20, "origin": [10, 17], "other": [2, 6, 7, 9, 11, 19, 24], "our": [1, 23], "output": 4, "outsid": [2, 3], "over": 8, "overrid": [2, 3, 4, 23], "own": [4, 9, 18], "packag": [1, 15, 16, 23], "pair": 10, "paper": 24, "paradox": 10, "parallel": [6, 7, 8, 10, 14, 19, 21, 23], "parallel_env": [3, 4, 23], "parallel_to_aec": 23, "parallel_wrapp": 4, "paramet": 4, "past": 4, "penal": 16, "penalti": [15, 16, 17], "per": [2, 3, 12, 20], "percentag": [8, 10], "perform": 24, "pettingzoo": [2, 3, 5, 15, 16, 20, 23], "philosophi": 24, "piec": 9, "pip": [1, 20, 21, 23], "piston": 17, "piston_i": 17, "pistonbal": 5, "place": [8, 9, 10, 11, 17], "placement": [9, 11], "plai": [2, 3, 18], "plane": [9, 11, 18], "player": [9, 11, 18], "player_i": [9, 11], "pleas": [12, 20], "point": [5, 7, 9, 10, 11, 18, 19], "polici": [2, 3, 4, 20, 24], "posit": [6, 7, 8, 14, 19], "position_distribut": 8, "possibl": [10, 24], "possible_ag": [2, 3, 4], "practic": 23, "prefer": 10, "previou": 12, "print": [2, 3, 4], "probabl": 12, "problem": [8, 14], "problem_nam": 10, "problemat": [20, 21], "program": 12, "progress": [2, 3], "proport": 17, "provid": [12, 20, 24], "public": 20, "pure": 23, "puzzl": 18, "py": 23, "pypi": 22, "pytest": 23, "python": [2, 20], "pz": [2, 3, 4, 20, 23], "qmix": 3, "r": 1, "rack": 13, "rais": 17, "random": [8, 10, 17], "random_drop": 17, "random_toll_percentag": 10, "randomis": 14, "randomli": [8, 10, 12, 18], "rang": 4, "rather": 2, "raw_env": 23, "reach": [6, 7, 8, 9, 11, 14, 17, 19], "reachabl": 12, "realli": 12, "rebuild": 1, "receiv": [3, 8, 12], "recent": 4, "record": 4, "recordepisodestatist": 4, "rectangular": 18, "reimplement": 12, "reinforc": 20, "releas": 2, "remov": [2, 3, 18], "render": [2, 3, 6, 7, 8, 9, 10, 11, 12, 14, 17, 18, 19], "render_mod": [2, 3, 6, 7, 8, 9, 10, 11, 12, 14, 17, 18, 19, 20], "repositori": [20, 23], "repres": [4, 6, 7, 9, 10, 11, 12, 14, 15, 16, 18, 19], "requir": [1, 20, 21], "research": 20, "reset": [2, 3, 20], "resourc": 2, "respect": [3, 11], "return": [2, 3, 20, 23], "reus": 24, "reward": [2, 3, 4, 13, 20, 23, 24], "reward_schem": 8, "reward_spac": [2, 3, 4, 23], "rgb": 17, "rgb_arrai": [2, 3, 11, 17], "right": [8, 9, 14, 17, 18], "rl": [2, 9, 11, 18, 20], "road": 10, "roijer": 12, "rout": 10, "row": 9, "run": [14, 23], "same": [2, 3, 5, 9, 11, 12, 18], "sampl": [2, 3, 20], "scalar": [2, 3, 4, 17, 20], "scale": [4, 11], "scheme": 8, "score": 13, "screen": 11, "screen_scal": 11, "second": [2, 9, 11, 16], "section": [8, 9, 11, 18], "section_capac": 8, "section_consumpt": 8, "section_id": 8, "see": [2, 3, 12, 15, 16, 20, 21, 23], "seed": [2, 3, 12, 20], "select": [2, 10, 12, 18], "self": [2, 23, 24], "send": 12, "separ": 18, "sequenc": 11, "sequenti": 18, "server": 20, "set": [9, 11, 12, 17, 18, 20, 24], "shake": 16, "shape": [4, 6, 7, 10, 19, 23], "share": 18, "shift": [2, 20], "should": [2, 6, 7, 11, 12, 19, 23], "side": [6, 7, 19], "similar": [2, 4, 20], "simpl": [2, 20], "singl": [2, 9, 11, 15, 16, 18, 20, 24], "sister": 16, "size": [6, 7, 18, 19], "so": [3, 4, 10], "some": [4, 20, 21], "sourc": [2, 3, 4, 6, 7, 10, 19, 20], "space": [2, 3, 4, 5, 13, 23, 24], "specif": [2, 3, 9, 11, 12, 18], "specifi": [2, 17, 23], "speed": [6, 7, 19], "sphinx": 1, "split": 4, "squar": [9, 18], "stabil": 4, "stai": [8, 14, 17], "stand": 11, "standard": [2, 3, 20], "start": 2, "state": [2, 3], "stateless": [10, 12], "static": 19, "statist": 4, "step": [2, 3, 6, 7, 15, 16, 19, 20], "still": [15, 16, 17], "store": 2, "str": [2, 3, 6, 7, 8, 10, 19], "straight": 9, "string": [2, 3], "structur": 2, "subprocess": 2, "successfulli": 11, "sum": 8, "suppli": [20, 21], "support": [2, 3], "surround": [5, 6], "surround_v0": 19, "survei": [2, 20], "switch": 2, "system": [20, 21], "t": [4, 12, 23], "take": [2, 3, 4, 10, 17], "taken": [2, 5], "target": [5, 6, 7, 19], "target_spe": [6, 7, 19], "tax": 10, "team": [18, 24], "team_reward": 18, "tensor": [9, 11, 18], "termin": [2, 3, 20], "terminate_on_fal": [15, 16], "test": [20, 21, 23], "than": 11, "thei": [9, 11, 18], "them": [2, 4, 9, 11, 17, 20], "themselv": 5, "therefor": [10, 12], "thi": [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 17, 18, 19, 20, 21, 23], "third": 9, "three": 9, "through": [2, 3], "tile": 18, "time": [1, 2, 9, 10, 11, 17], "time_penalti": 17, "timestep": [6, 7, 8, 10, 12, 14, 19], "todo": [5, 20], "togeth": 12, "token": 11, "toll": 10, "toll_mod": 10, "tool": 24, "top": [4, 11], "total": 12, "toward": [6, 7, 15, 16, 17, 19], "train": 3, "trajectori": [4, 7, 19], "transform": 4, "travel": [6, 7, 10, 15, 16, 19], "true": [12, 15, 16, 17, 18], "trunc_prob": 12, "truncat": [2, 3, 20], "try": [6, 9, 22], "tupl": [3, 8, 14], "turn": [9, 11, 18], "two": [8, 9, 10, 11, 17, 18], "txt": 1, "type": [2, 3, 4, 8, 12, 14], "type_distribut": 8, "typic": [2, 3], "uint8": 17, "unchang": 17, "under": 10, "uniform": 8, "until": 11, "up": [9, 14, 17], "upper": 12, "us": [2, 4, 8, 10, 11, 12, 17, 20, 21, 23], "usag": [20, 21], "usual": [9, 11, 18], "util": [2, 3, 20, 23, 24], "v0": 5, "valid": 4, "valu": [2, 3, 4, 6, 7, 8, 11, 12, 16, 17, 19, 20], "variabl": 2, "varianc": 4, "variant": [9, 11, 18], "vec_reward": [2, 3, 20], "vector": [2, 4, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 20, 23], "vectori": 4, "veri": [2, 20], "version": [5, 10, 22, 23], "vertic": [11, 18], "via": 8, "view": 3, "villag": 12, "w": 12, "w_bonu": 12, "wa": [4, 6, 7, 10, 12, 17, 19], "wai": 18, "walker_0": [2, 20], "walker_1": [2, 20], "walker_2": [2, 20], "walker_i": [15, 16], "wall": 17, "we": [2, 20, 24], "websit": 20, "weight": [2, 3, 4, 20], "well": [5, 20, 23], "were": 18, "when": [6, 7, 11, 17, 18, 19], "where": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19, 20], "whether": [9, 11, 14, 17, 18], "which": [2, 3, 6, 7, 9, 11, 12, 16, 18, 19, 20, 23], "while": [3, 5, 6, 7, 10, 19], "whose": [4, 9, 11, 18], "width": [9, 11, 18], "win": [9, 11], "window": [2, 3, 17], "without": [5, 11], "work": [20, 23], "worker": 12, "workflow": 22, "would": [2, 3, 20], "x": [9, 11, 18], "x_0": [6, 7, 19], "x_1": [6, 7, 19], "x_n": [6, 7, 19], "x_targ": [6, 7, 19], "xyz": [6, 7, 19], "y": [9, 18], "y_0": [6, 7, 19], "y_1": [6, 7, 19], "y_n": [6, 7, 19], "y_targ": [6, 7, 19], "you": [2, 3, 20, 23], "your": [1, 2, 3, 20, 23], "z": 9, "z_0": [6, 7, 19], "z_1": [6, 7, 19], "z_n": [6, 7, 19], "z_targ": [6, 7, 19], "zero": [9, 11, 18]}, "titles": ["404 - Page Not Found", "MOMAland documentation", "AEC", "Parallel", "Wrappers and Utils", "All Environments", "Catch", "Escort", "MO-Beach", "MO-Breakthrough", "MO-Congestion", "MO-Connect4", "MO-GemMining", "MO-Ingenious", "MO-ItemGathering", "MO-Multiwalker", "MO-MultiwalkerStability", "MO-Pistonball", "MO-SameGame", "Surround", "API", "Install", "Release Notes", "Making a Custom Environment", "Learning algorithms"], "titleterms": {"0": 22, "1": 22, "2": 22, "404": 0, "Not": 0, "The": 0, "action": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19], "aec": [2, 4], "algorithm": 24, "all": 5, "api": 20, "argument": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19], "attribut": [2, 3], "beach": 8, "breakthrough": 9, "build": 1, "catch": 6, "cite": 20, "commit": 23, "congest": 10, "connect4": 11, "convers": 4, "could": 0, "credit": [6, 7, 10, 12, 17, 19], "custom": 23, "document": 1, "dummi": 22, "environ": [5, 23], "episod": [6, 7, 8, 10, 12, 14, 15, 16, 17, 19], "escort": 7, "found": 0, "gemmin": 12, "histori": [9, 11, 18], "hook": 23, "ingeni": 13, "instal": [20, 21], "itemgath": 14, "learn": 24, "legal": [9, 11, 18], "make": 23, "mask": [9, 11, 18], "method": [2, 3], "mo": [8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18], "moaecenv": 2, "momaland": 1, "moparallelenv": 3, "multiwalk": 15, "multiwalkerst": 16, "note": 22, "observ": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19], "page": 0, "parallel": [3, 4], "pistonbal": 17, "pre": 23, "releas": 22, "request": 0, "reward": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19], "samegam": 18, "setup": 23, "space": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19], "start": [6, 7, 8, 9, 10, 11, 12, 14, 17, 18, 19], "state": [6, 7, 8, 9, 10, 11, 12, 14, 17, 18, 19], "surround": 19, "termin": [6, 7, 8, 10, 12, 14, 15, 16, 17, 19], "truncat": [6, 7, 8, 10, 12, 14, 17, 19], "usag": [2, 3], "util": 4, "v0": 22, "version": [9, 11, 18], "wrapper": 4}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.1.0": [[21, "release-0-1-0"]], "404 - Page Not Found": [[0, "page-not-found"]], "AEC": [[2, "aec"], [4, "aec"]], "AEC to Parallel": [[4, "aec-to-parallel"]], "API": [[19, "api"]], "Action Space": [[6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [12, "action-space"], [14, "action-space"], [15, "action-space"], [16, "action-space"], [17, "action-space"], [18, "action-space"]], "All Environments": [[5, "all-environments"]], "Arguments": [[6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [11, "arguments"], [12, "arguments"], [14, "arguments"], [15, "arguments"], [16, "arguments"], [17, "arguments"], [18, "arguments"]], "Attributes": [[2, "attributes"], [3, "attributes"]], "Build the Documentation": [[1, "build-the-documentation"]], "Catch": [[6, "catch"]], "Citing": [[19, "citing"]], "Conversion": [[4, "conversion"]], "Credits": [[6, "credits"], [7, "credits"], [10, "credits"], [12, "credits"], [16, "credits"], [18, "credits"]], "Episode Termination": [[6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [12, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [16, "episode-termination"], [18, "episode-termination"]], "Episode Truncation": [[6, "episode-truncation"], [7, "episode-truncation"], [8, "episode-truncation"], [10, "episode-truncation"], [12, "episode-truncation"], [14, "episode-truncation"], [16, "episode-truncation"], [18, "episode-truncation"]], "Escort": [[7, "escort"]], "Install": [[19, "install"], [20, "install"]], "Learning algorithms": [[23, "learning-algorithms"]], "Legal Actions Mask": [[9, "legal-actions-mask"], [11, "legal-actions-mask"], [17, "legal-actions-mask"]], "MO-Beach": [[8, "mo-beach"]], "MO-Breakthrough": [[9, "mo-breakthrough"]], "MO-Congestion": [[10, "mo-congestion"]], "MO-Connect4": [[11, "mo-connect4"]], "MO-GemMining": [[12, "mo-gemmining"]], "MO-Ingenious": [[13, "mo-ingenious"]], "MO-ItemGathering": [[14, "mo-itemgathering"]], "MO-MultiwalkerStability": [[15, "mo-multiwalkerstability"]], "MO-Pistonball": [[16, "mo-pistonball"]], "MO-SameGame": [[17, "mo-samegame"]], "MOAECEnv": [[2, "moaecenv"]], "MOMAland documentation": [[1, "momaland-documentation"]], "MOParallelEnv": [[3, "moparallelenv"]], "Making a Custom Environment": [[22, "making-a-custom-environment"]], "Methods": [[2, "methods"], [3, "methods"]], "Observation Space": [[6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [12, "observation-space"], [14, "observation-space"], [15, "observation-space"], [16, "observation-space"], [17, "observation-space"], [18, "observation-space"]], "Parallel": [[3, "parallel"], [4, "parallel"]], "Parallel to AEC": [[4, "parallel-to-aec"]], "Release Notes": [[21, "release-notes"]], "Reward Space": [[6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [10, "reward-space"], [12, "reward-space"], [14, "reward-space"], [15, "reward-space"], [16, "reward-space"], [18, "reward-space"]], "Rewards": [[9, "rewards"], [11, "rewards"], [17, "rewards"]], "Setup pre-commit hooks": [[22, "setup-pre-commit-hooks"]], "Starting State": [[6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [12, "starting-state"], [14, "starting-state"], [16, "starting-state"], [17, "starting-state"], [18, "starting-state"]], "Surround": [[18, "surround"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Usage": [[2, "usage"], [3, "usage"]], "Version History": [[9, "version-history"], [11, "version-history"], [17, "version-history"]], "Wrappers and Utils": [[4, "wrappers-and-utils"]], "v0.0.1: Dummy release": [[21, "release-v0-0-1"]], "v0.0.2: Dummy release 2": [[21, "release-v0-0-2"]]}, "docnames": ["404", "README", "api/aec", "api/parallel", "api/wrappers", "environments/all-envs", "environments/catch", "environments/escort", "environments/mobeach", "environments/mobreakthrough", "environments/mocongestion", "environments/moconnect4", "environments/mogem_mining", "environments/moingenious", "environments/moitem_gathering", "environments/momultiwalker_stability", "environments/mopistonball", "environments/mosame_game", "environments/surround", "index", "introduction/install", "release_notes", "tutorials/custom_env", "tutorials/learning_algorithms"], "envversion": {"sphinx": 61, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1}, "filenames": ["404.md", "README.md", "api/aec.md", "api/parallel.md", "api/wrappers.md", "environments/all-envs.md", "environments/catch.md", "environments/escort.md", "environments/mobeach.md", "environments/mobreakthrough.md", "environments/mocongestion.md", "environments/moconnect4.md", "environments/mogem_mining.md", "environments/moingenious.md", "environments/moitem_gathering.md", "environments/momultiwalker_stability.md", "environments/mopistonball.md", "environments/mosame_game.md", "environments/surround.md", "index.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "tutorials/learning_algorithms.md"], "indexentries": {"action_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.action_space", false]], "action_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.action_space", false]], "action_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.action_spaces", false]], "action_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.action_spaces", false]], "agent_selection (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agent_selection", false]], "agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agents", false]], "agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.agents", false]], "close() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.close", false]], "close() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.close", false]], "infos (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.infos", false]], "linearizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.LinearizeReward", false]], "linearizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.LinearizeReward", false]], "max_num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.max_num_agents", false]], "max_num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.max_num_agents", false]], "mo_aec_to_parallel_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_aec_to_parallel_wrapper", false]], "mo_parallel_to_aec_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_parallel_to_aec_wrapper", false]], "moaecenv (class in momaland.utils.env)": [[2, "momaland.utils.env.MOAECEnv", false]], "moparallelenv (class in momaland.utils.env)": [[3, "momaland.utils.env.MOParallelEnv", false]], "normalizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.NormalizeReward", false]], "normalizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.NormalizeReward", false]], "num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.num_agents", false]], "num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.num_agents", false]], "observation_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observation_space", false]], "observation_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.observation_space", false]], "observation_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.observation_spaces", false]], "observation_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.observation_spaces", false]], "observe() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observe", false]], "possible_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.possible_agents", false]], "possible_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.possible_agents", false]], "recordepisodestatistics (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.RecordEpisodeStatistics", false]], "render() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.render", false]], "render() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.render", false]], "reset() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reset", false]], "reset() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reset", false]], "reward_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reward_space", false]], "reward_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reward_space", false]], "reward_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.reward_spaces", false]], "reward_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.reward_spaces", false]], "rewards (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.rewards", false]], "state() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.state", false]], "step() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.step", false]], "step() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.step", false]], "terminations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.terminations", false]], "truncations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.truncations", false]]}, "objects": {"momaland.utils.aec_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"]], "momaland.utils.conversions": [[4, 0, 1, "", "mo_aec_to_parallel_wrapper"], [4, 0, 1, "", "mo_parallel_to_aec_wrapper"]], "momaland.utils.env": [[2, 0, 1, "", "MOAECEnv"], [3, 0, 1, "", "MOParallelEnv"]], "momaland.utils.env.MOAECEnv": [[2, 1, 1, "", "action_space"], [2, 2, 1, "", "action_spaces"], [2, 2, 1, "", "agent_selection"], [2, 2, 1, "", "agents"], [2, 1, 1, "", "close"], [2, 2, 1, "", "infos"], [2, 2, 1, "", "max_num_agents"], [2, 2, 1, "", "num_agents"], [2, 1, 1, "", "observation_space"], [2, 2, 1, "", "observation_spaces"], [2, 1, 1, "", "observe"], [2, 2, 1, "", "possible_agents"], [2, 1, 1, "", "render"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "reward_space"], [2, 2, 1, "", "reward_spaces"], [2, 2, 1, "", "rewards"], [2, 1, 1, "", "step"], [2, 2, 1, "", "terminations"], [2, 2, 1, "", "truncations"]], "momaland.utils.env.MOParallelEnv": [[3, 1, 1, "", "action_space"], [3, 2, 1, "", "action_spaces"], [3, 2, 1, "", "agents"], [3, 1, 1, "", "close"], [3, 2, 1, "", "max_num_agents"], [3, 2, 1, "", "num_agents"], [3, 1, 1, "", "observation_space"], [3, 2, 1, "", "observation_spaces"], [3, 2, 1, "", "possible_agents"], [3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "reward_space"], [3, 2, 1, "", "reward_spaces"], [3, 1, 1, "", "state"], [3, 1, 1, "", "step"]], "momaland.utils.parallel_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"], [4, 0, 1, "", "RecordEpisodeStatistics"]]}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute"}, "terms": {"": [2, 3, 4, 5, 6, 7, 8, 9, 11, 16, 17, 18, 19, 21, 23], "0": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "00e": 16, "01": 16, "01567": 15, "02": 15, "03": 21, "04": 16, "05": 21, "08": 4, "1": [2, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18], "10": [6, 7, 12, 14, 17, 18], "100": [8, 15, 16], "100e": 15, "11": [12, 13], "110": 15, "12": [8, 12, 21], "120": 16, "125": 16, "13": 12, "14": 12, "15": [6, 7, 12, 17, 18], "16": 12, "17": 12, "18": [12, 13], "19": [12, 16], "192": 9, "1e": 4, "2": [2, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "20": [9, 11, 12, 16, 21], "200": [6, 7, 18], "2019": 14, "2023": 21, "2024": 21, "209": 15, "21": 21, "225": 17, "23": 12, "24": 21, "25": 21, "255": 16, "26": 21, "27": 21, "28": 21, "2880": 13, "29": 21, "2d": [6, 7, 8, 10, 14, 15, 18], "3": [2, 3, 6, 7, 8, 9, 10, 12, 14, 16, 17, 18, 19], "30": 17, "31": [15, 21], "35": 21, "37": 21, "38": 21, "39": 21, "3d": [6, 7, 16, 18], "4": [5, 9, 11, 12, 14, 15, 21], "40": 21, "41": 21, "4199": 10, "42": [2, 3, 12, 19, 21], "43": 21, "44": 21, "45": 21, "457": 16, "46": [15, 21], "48": 21, "49": 21, "5": [2, 6, 7, 8, 9, 12, 14, 16, 17, 18, 19], "50625": 17, "51": 21, "52": 21, "53": 21, "54": [15, 21], "567e": 15, "6": [8, 11, 12, 13, 16], "60": 16, "7": [2, 3, 8, 11, 12, 19], "75": 16, "79e": 16, "8": [2, 4, 9, 11, 12, 14, 16, 19], "881808": 8, "8x8": [9, 14], "9": [4, 11, 12], "99": [4, 8], "A": [2, 3, 4, 5, 6, 7, 8, 10, 14, 15, 18, 19], "And": 3, "As": [12, 16], "At": [9, 11], "For": [1, 2, 3, 4, 19], "If": [8, 9, 11, 15, 17, 19], "In": [3, 9, 10, 11], "It": 8, "On": 4, "The": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 23], "There": [5, 9], "These": [2, 3], "To": [1, 19, 20, 23], "With": 11, "_build": 1, "_env": [2, 3, 19], "_of_a_of_current_typ": 8, "_scalartype_co": 2, "a_typ": 8, "about": 1, "abov": [16, 17], "absolut": 21, "accept": 2, "access": [2, 4], "accord": 8, "accumul": [2, 5, 17], "action": [2, 3, 5, 13, 19, 23], "action_mask": [9, 11, 13, 17], "action_spac": [2, 3, 19], "actiontyp": [2, 3], "ad": [2, 3, 12], "adapt": [5, 6, 7, 10, 15, 16, 18], "add": [4, 21, 22], "addit": [5, 9, 11], "addition": [5, 9, 11, 17, 22], "adversari": 5, "aec": [16, 19, 20, 21, 22], "aec_env": 4, "aec_wrapp": 4, "aecwrapp": 4, "after": [2, 8, 10, 12], "agent": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 21, 22], "agent_": 5, "agent_0": 4, "agent_1": 4, "agent_i": [6, 7, 8, 10, 12, 13, 14, 17, 18], "agent_it": [2, 19], "agent_select": 2, "agentid": [2, 3], "aka": [2, 19], "algorithm": [19, 20], "aliv": 15, "all": [2, 3, 8, 9, 11, 12, 14, 17, 19, 20], "all_modul": 22, "allow": 5, "also": [2, 4, 5, 8, 9, 19], "altern": 3, "alternatingli": 9, "alwai": 10, "amount": [6, 7, 16, 18], "an": [2, 3, 4, 5, 6, 7, 9, 10, 11, 12, 14, 16, 17, 18, 19, 22], "analysi": [2, 19], "angl": 15, "ani": [2, 5, 9, 11, 12, 17, 23], "anoth": [12, 17], "ansi": [2, 3], "api": [2, 3, 4, 20], "appli": 4, "appropri": 3, "ar": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 15, 16, 17, 18, 22, 23], "area": [6, 7, 18], "around": 5, "arrai": [2, 3, 4, 6, 7, 18, 19], "assign": [2, 19], "attende": 5, "autobuild": 1, "automat": [1, 2], "avail": [5, 9, 11, 14, 15, 17], "averag": [4, 6, 7, 18], "avoid": [4, 5, 6, 7, 9, 10, 15, 18], "award": [9, 11], "b": 1, "baier_2015": 5, "ball": 16, "ball_elast": 16, "ball_frict": 16, "ball_mass": 16, "bandit": 12, "bargiacchi": 12, "bargiacchi_2018": 5, "base": [2, 3, 4, 5, 9, 10, 11, 12, 15, 17, 19], "baselin": 23, "basic": [19, 20], "beach": 5, "becom": 17, "been": [11, 14], "befor": 16, "behavior": 4, "below": [9, 11, 17], "bernoulli": 12, "better": 21, "between": [4, 5, 16, 17, 19], "binari": [9, 11, 17], "board": [5, 9, 11, 13, 17, 21], "board_height": [9, 11, 17], "board_siz": 11, "board_width": [9, 11, 17], "bonu": 12, "bool": [2, 3], "both": [9, 11, 15, 21], "bottom": 11, "bound": 15, "box": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18], "bpd": 21, "braess": 10, "break": 5, "breakthrough": [5, 21], "bump": 21, "call": [2, 5, 17], "can": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 16, 17, 18, 19, 20], "cannot": [2, 3, 11], "capac": [5, 8], "captur": [5, 9], "case": [9, 10, 11], "catch": 5, "catch_v0": 6, "cbox": 12, "cd": 1, "cell": [9, 11, 14], "central": [3, 23], "certain": [19, 20], "chang": [1, 2, 3, 4, 8, 15, 16, 21], "changelog": 21, "characteris": 5, "check": [2, 4, 19, 21, 22], "choic": 5, "choos": 10, "circl": 5, "class": [2, 3, 4, 19, 22], "classic": [2, 3], "cleanrl": 23, "close": [2, 3, 16, 17, 19, 23], "closer": 16, "code": [4, 6, 7, 10, 12, 16, 18], "codebas": 10, "colab": [2, 19], "collect": 5, "collid": [6, 7, 18], "collis": [6, 7, 18], "color": [5, 17], "color_reward": 17, "colors_n": 5, "colour": 5, "column": [5, 11, 17], "column_object": 11, "commun": 19, "compar": 19, "compat": 23, "competit": 5, "compliant": 19, "compon": [16, 19, 20], "condit": [6, 7, 18], "configur": 5, "conflict": 11, "congest": [5, 21], "connect": [2, 5, 11, 12, 17, 21], "connect4": 5, "constant": 10, "constructor": 22, "consumpt": 8, "contain": [1, 2, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 23], "continu": [5, 6, 7, 8, 15, 16, 18, 23], "contribut": [1, 21], "contributor": 21, "control": 2, "convers": 22, "convert": 4, "cooper": [5, 12, 16], "coordin": [6, 7, 9, 17, 18, 19], "corner": 5, "correctli": 4, "correl": 12, "correlated_object": 12, "correspond": [2, 8, 9, 10, 11, 12], "cost": [5, 10], "could": [2, 3], "count": [5, 17], "crazyrl": 21, "creat": [2, 19, 22], "crowded": 5, "current": [2, 3, 8, 9, 11, 17, 23], "customiz": 12, "cycl": 16, "d": 17, "data": 3, "decentr": 3, "decis": [2, 19], "default": [2, 3, 5, 8, 11, 12, 14, 15, 16, 17], "defaultli": 12, "defin": 22, "definit": [2, 19], "demonstr": 21, "depend": [4, 10, 19, 20], "describ": [9, 11, 17], "descript": 5, "destin": [5, 10], "detail": [2, 3, 19], "determin": 14, "develop": 19, "diagon": [9, 11], "dict": [2, 3, 4, 9, 11, 13, 17], "dictionari": [3, 9, 11, 17, 22], "diederik": 12, "differ": [2, 5, 8, 10, 12, 17, 19], "dimens": [9, 11, 17], "direct": [6, 7, 18], "directli": 2, "directori": [22, 23], "dirhtml": 1, "disappear": 17, "discord": 19, "discount": 4, "discret": [5, 8, 9, 10, 11, 12, 13, 14, 16, 17, 21, 23], "disentangl": 16, "displai": [2, 3, 6, 7, 10, 18], "distanc": [5, 6, 7, 15, 18], "distance_other_dron": 5, "distance_target": 5, "distribut": 8, "divers": 5, "divid": 9, "do": [9, 11], "doc": [1, 21], "document": [2, 3, 15, 19, 20, 21, 22], "doe": [2, 19, 20], "domain": [8, 12], "don": 22, "down": [14, 16, 17], "draw": [9, 11], "driver": [5, 10], "drone": [5, 6, 7, 18], "drop": [11, 15, 16], "dtype": 2, "due": 12, "duplic": 4, "dure": 15, "dynam": 21, "e": [1, 2, 3, 12, 22], "each": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19, 22, 23], "edg": 16, "either": [5, 9, 10, 11, 17], "elast": 16, "element": [9, 11, 15, 17], "els": [2, 19], "empti": [9, 11, 14, 17], "encod": [9, 11, 17], "end": [4, 11, 15], "enforc": [2, 3], "enjoy": 5, "entir": 17, "entri": 14, "env": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 22], "env_nam": 22, "environ": [2, 3, 4, 6, 7, 8, 10, 12, 13, 14, 15, 16, 18, 19, 21, 23], "episod": 4, "epsilon": 4, "equal": [8, 11, 12], "equival": [2, 3], "escap": 6, "escort": 5, "escort_v0": 7, "essenti": [5, 19], "etc": 3, "eugenio": 12, "evalu": [21, 23], "even": 15, "everi": [1, 2, 3, 5, 11, 17], "everyth": [19, 20, 22, 23], "exampl": [2, 4, 6, 7, 8, 18, 19, 22], "except": [9, 11, 17], "exclud": 12, "exclus": [9, 11, 17], "execut": [2, 3], "exert": 15, "exist": 11, "expect": 12, "experiment": 21, "exponenti": 4, "export": 22, "extend": [2, 3, 5, 9, 11, 17, 22], "extens": 5, "extract": 5, "ezpickl": 21, "factor": [4, 11], "factori": 22, "fall": [11, 15, 17], "fals": [14, 17], "farama": 19, "fast": 5, "faster": [9, 11], "featur": 21, "felten": [6, 7, 18], "few": 4, "ffelten": 21, "file": 23, "fill": [9, 11, 17], "final": [7, 18], "final_target_loc": [7, 18], "find": 12, "finish": 16, "first": [2, 9, 15, 21], "fix": [4, 5, 21], "float": [2, 3, 4, 6, 7, 10, 18], "float32": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18], "folder": 1, "follow": [3, 6, 7, 15, 18, 19], "forc": 15, "fork": 1, "format": 5, "forward": 9, "found": [9, 11, 12, 17], "four": 11, "fourth": 9, "frame": 3, "friction": 16, "from": [2, 3, 5, 6, 7, 9, 10, 11, 12, 15, 16, 17, 18, 19, 22, 23], "front": 9, "full": [11, 21], "fulli": 12, "function": [2, 3, 12, 19, 22], "g": 22, "game": [5, 9, 11, 13, 17, 21], "gamma": 4, "gap": 17, "gather": [5, 14, 21], "gem": [5, 12, 21], "gener": [2, 3, 12, 21], "get": [5, 9, 11, 17], "github": 21, "give": 15, "given": [8, 9, 11, 12, 16, 17, 22], "global": [3, 8, 16], "go": [1, 5], "goal": 5, "greater": 12, "grid": [5, 9, 11, 14, 17], "ground": [6, 7, 18], "group": [5, 17], "guid": 20, "gupta_2017": 5, "gym": 3, "gymnasium": [2, 3], "ha": [2, 3, 4, 8, 9, 11, 12, 17], "handl": 4, "have": [4, 9, 10, 11, 14, 19, 22], "height": [9, 11, 17], "heintz": 14, "henc": 12, "here": [2, 19, 23], "heterogen": 10, "hiazmani": 21, "higher": 15, "hip": 15, "hold": [9, 11, 17], "home": 9, "horizont": [11, 17], "how": [1, 6, 7, 16, 18], "http": 19, "human": [2, 3, 6, 7, 10, 11, 16, 18, 19], "i": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23], "id": [8, 12, 14], "ident": 9, "idx": 4, "imag": 16, "immedi": 4, "implement": [2, 3, 21, 23], "import": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "incentiv": [9, 11], "includ": [5, 19, 20], "independ": 21, "index": [4, 9, 11, 17], "indic": [9, 11, 17, 23], "individu": [17, 23], "inf": [6, 7, 15, 18], "influenc": 5, "info": [2, 3, 19], "inform": [1, 5], "ingeni": [5, 21], "inherit": 4, "init_flying_po": [6, 7, 18], "init_target_loc": [6, 7, 18], "initi": [4, 6, 7, 8, 14, 17, 18, 22], "initial_map": 14, "inproceed": 19, "input": 4, "insert": [2, 3, 19], "insid": 22, "instal": [1, 22], "instanc": [2, 4, 12, 19], "instantan": 2, "instanti": 4, "instead": [19, 22], "int": [2, 3, 6, 7, 8, 10, 16, 18], "int32": 13, "int64": 14, "int8": [9, 11, 13, 17], "integ": [2, 3, 9, 11, 12, 14, 17], "interact": [2, 3, 19], "interest": 5, "intermedi": [7, 18], "intern": 2, "introduc": 5, "iql": 23, "isn": 12, "item": [5, 14, 21], "its": 5, "join": 19, "joint": 15, "just": 12, "kallstrom_2019": 5, "keep": [4, 5, 23], "kei": [2, 3, 4], "kept": 5, "knee": 15, "k\u00e4llstr\u00f6m": 14, "land": 11, "languag": 12, "last": [2, 8, 9, 12, 19], "latenc": 10, "launch": 21, "lead": 5, "learn": [6, 7, 10, 18, 19, 20, 21], "least": 17, "left": [8, 9, 14, 17], "length": [2, 3, 6, 7, 8, 12, 18], "less": 12, "level": [8, 15], "librari": [19, 23], "like": [2, 3, 4, 5, 17, 23], "limit": [12, 16], "linear": [4, 23], "linearizereward": [2, 4, 19], "linearreward": 3, "list": [2, 3, 23], "literatur": 5, "live": 12, "local": [8, 12, 16], "locat": [9, 11, 17], "log": 21, "look": 2, "loop": 21, "lose": [9, 11], "lost": 9, "lower": [15, 16], "made": [1, 11, 21], "mai": [2, 3], "main": [9, 11, 17, 21], "maintain": 5, "make": [1, 2, 19], "mani": 5, "mannion_2018": 5, "map": 14, "margin": 10, "markdown": 21, "marl": 5, "mass": 16, "max": 9, "max_connect": 12, "max_cycl": 16, "max_mov": 9, "max_num_ag": [2, 3], "max_prob": 12, "max_work": 12, "maxim": [5, 6, 7, 15, 18], "maximis": 16, "maximum": [8, 12, 14, 16], "mct": 10, "md": 1, "mean": [9, 11, 17], "member": [2, 3, 22], "merg": 21, "met": [6, 7, 18], "method": 22, "mgoulao": 21, "min_connect": 12, "min_prob": 12, "min_work": 12, "mine": [5, 12], "minim": [6, 7, 10, 16, 18], "minimis": 10, "minimum": [5, 12], "miss": 21, "mix": 5, "mixtur": [5, 8], "mo": [4, 5, 21], "mo_aec_to_parallel_wrapp": 4, "mo_parallel_to_aec": 22, "mo_parallel_to_aec_wrapp": 4, "moaec": 2, "moaecenv": 22, "mobeach_v0": [8, 22], "mobil": 5, "mobreakthrough_v0": 9, "mocongestion_v0": 10, "moconnect4_v0": 11, "mode": [2, 3, 5, 6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18], "model": [2, 19], "modifi": 9, "modul": 4, "mogem_mining_v0": 12, "moingenious_v0": 13, "moitem_gathering_v0": 14, "momaland": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23], "momappo": [21, 23], "momarl": 19, "momultiwalk": 21, "momultiwalker_st": [2, 3, 19], "momultiwalker_stability_v0": [2, 3, 15, 19], "monetari": 10, "moparallel": 3, "moparallelenv": 22, "mopistonball_v0": 16, "more": [1, 2, 3, 5, 11, 19], "morl": 23, "mosame_game_v0": 17, "most": 12, "move": [4, 6, 7, 8, 9, 11, 16, 17, 18], "move_count": [9, 11], "multi": [2, 3, 5, 9, 10, 11, 14, 17, 19, 23], "multibinari": 9, "multipl": 5, "multipli": 12, "multiwalk": [5, 15, 21], "must": [2, 3, 4, 5], "n": [2, 5, 17], "n_piston": 16, "n_reward": 5, "name": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 23], "nativ": 4, "navig": 5, "ndarrai": [2, 3], "need": [10, 16], "neg": [9, 12, 14], "negat": [9, 11], "network": [2, 5, 10], "nevertheless": 23, "new": [4, 21, 22], "newli": 4, "next": [2, 16], "non": 12, "none": [2, 3, 6, 7, 8, 10, 14, 16, 18, 19], "normal": 4, "normalizereward": 4, "note": [2, 12], "notebook": [2, 19, 21], "np": [2, 3, 4, 19], "nparrai": [6, 7, 18], "nth": 2, "num_ag": [2, 3, 8, 10, 12, 17], "num_color": 17, "num_dron": [6, 7, 18], "num_intermediate_point": [7, 18], "num_object": [9, 12, 17], "num_timestep": [8, 10, 12, 14], "number": [5, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18], "numpi": [2, 3, 19], "ob": 5, "object": [2, 3, 4, 5, 8, 9, 10, 11, 12, 14, 15, 17, 19, 23], "observ": [2, 3, 13, 19, 23], "observation_spac": [2, 3], "obstyp": [2, 3], "occup": [5, 8], "occupi": 8, "occur": 14, "od": 10, "off": 5, "ol": [21, 23], "onc": 1, "one": [5, 6, 7, 9, 11, 15, 17, 18], "onli": [5, 8, 9, 17], "open": 19, "oppon": [5, 9, 11], "oppos": [2, 3], "option": [2, 3, 5, 6, 7, 9, 10, 11, 16, 18, 19], "order": [6, 7, 17, 18], "org": 19, "origin": [5, 10, 16], "other": [2, 5, 6, 7, 9, 11, 18, 23], "our": [1, 22], "outer": 21, "output": 4, "outsid": [2, 3], "over": [5, 8], "overrid": [2, 3, 4, 22], "own": [4, 5, 9, 17], "packag": [1, 5, 15, 22], "pair": 10, "paper": [5, 23], "paradox": 10, "parallel": [6, 7, 8, 10, 14, 18, 20, 22], "parallel_env": [3, 4, 22], "parallel_to_aec": 22, "parallel_wrapp": 4, "paramet": 4, "past": 4, "penal": 15, "penalti": [15, 16, 21], "per": [2, 3, 5, 12, 19], "percentag": [8, 10], "perform": 23, "pettingzoo": [2, 3, 5, 15, 19, 22], "philosophi": 23, "piec": [5, 9], "pip": [1, 19, 20, 22], "piston": 16, "piston_i": 16, "pistonbal": 5, "place": [8, 9, 10, 11, 16], "placement": [9, 11], "plai": [2, 3, 17], "plane": [9, 11, 17], "player": [5, 9, 11, 17], "player_i": [9, 11], "pleas": [12, 19], "point": [5, 7, 9, 10, 11, 17, 18], "polici": [2, 3, 4, 19, 23], "posit": [6, 7, 8, 14, 18], "position_distribut": 8, "possibl": [5, 10, 23], "possible_ag": [2, 3, 4], "practic": 22, "prefer": 10, "previou": 12, "print": [2, 3, 4], "probabl": 12, "problem": [5, 8, 14], "problem_nam": 10, "problemat": [19, 20], "producit": 5, "program": 12, "progress": [2, 3, 5], "proport": 16, "provid": [5, 12, 19, 23], "public": 19, "pure": 22, "puzzl": [5, 17], "py": 22, "pypi": 21, "pytest": 22, "python": [2, 19], "pz": [2, 3, 4, 5, 19, 22], "q": 21, "qmix": 3, "r": 1, "rack": 13, "rais": 16, "random": [8, 10, 16], "random_drop": 16, "random_toll_percentag": 10, "randomis": 14, "randomli": [8, 10, 12, 17], "rang": 4, "rather": 2, "raw_env": 22, "reach": [5, 6, 7, 8, 9, 11, 14, 16, 18], "reachabl": 12, "realli": 12, "rebuild": 1, "receiv": [3, 8, 12], "recent": 4, "record": 4, "recordepisodestatist": 4, "recordstatisticswrapp": 21, "rectangular": 17, "reflect": 5, "reimplement": 12, "reinforc": 19, "releas": 2, "remov": [2, 3, 5, 17, 21], "render": [2, 3, 6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18], "render_mod": [2, 3, 6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18, 19], "repositori": [19, 22], "repres": [4, 5, 6, 7, 9, 10, 11, 12, 14, 15, 17, 18], "requir": [1, 19, 20, 21], "research": 19, "reset": [2, 3, 19], "resourc": 2, "respect": [3, 5, 11], "restrict": 5, "return": [2, 3, 19, 22], "reus": 23, "reward": [2, 3, 4, 5, 13, 19, 21, 22, 23], "reward_schem": 8, "reward_spac": [2, 3, 4, 22], "rgb": 16, "rgb_arrai": [2, 3, 11, 16], "right": [5, 8, 9, 14, 16, 17], "rl": [2, 9, 11, 17, 19], "road": [5, 10], "roijer": 12, "rout": [5, 10], "routechoic": 5, "row": 9, "rradul": 21, "rule": 5, "run": [14, 22], "same": [2, 3, 5, 9, 11, 12, 17], "samegam": [5, 21], "sampl": [2, 3, 19], "scalar": [2, 3, 4, 16, 19, 23], "scale": [4, 11], "scheme": 8, "score": [5, 13], "screen": 11, "screen_scal": 11, "script": 21, "second": [2, 9, 11, 15], "section": [5, 8, 9, 11, 17], "section_capac": 8, "section_consumpt": 8, "section_id": 8, "see": [2, 3, 12, 15, 19, 20, 22], "seed": [2, 3, 12, 19, 21], "seek": 5, "select": [2, 10, 12, 17], "self": [2, 5, 22, 23], "send": 12, "separ": [5, 17], "sequenc": 11, "sequenti": 17, "server": 19, "set": [9, 11, 12, 16, 17, 19, 23], "shake": 15, "shape": [4, 6, 7, 10, 18, 22], "share": [5, 17], "shift": [2, 19], "should": [2, 6, 7, 11, 12, 18, 22], "side": [6, 7, 18], "similar": [2, 4, 19], "simpl": [2, 19], "singl": [2, 5, 9, 11, 15, 17, 19, 21, 23], "sister": 15, "size": [6, 7, 17, 18, 21], "so": [3, 4, 10], "some": [4, 19, 20], "sourc": [2, 3, 4, 6, 7, 10, 18, 19], "space": [2, 3, 4, 5, 13, 22, 23], "specif": [2, 3, 9, 11, 12, 17], "specifi": [2, 16, 22], "speed": [6, 7, 18], "sphinx": 1, "split": 4, "squar": [9, 17], "stabil": [4, 5, 21], "stai": [8, 14, 16], "stand": 11, "standard": [2, 3, 19], "start": 2, "state": [2, 3], "stateless": [10, 12], "static": 18, "statist": 4, "steadi": 5, "step": [2, 3, 6, 7, 15, 18, 19], "still": [15, 16], "store": 2, "str": [2, 3, 6, 7, 8, 10, 18], "straight": 9, "string": [2, 3], "structur": 2, "stuff": 21, "subprocess": 2, "successfulli": 11, "sum": [5, 8], "suppli": [19, 20], "support": [2, 3, 5], "surround": [5, 6], "surround_v0": 18, "survei": [2, 19], "switch": 2, "system": [19, 20], "t": [4, 12, 22], "take": [2, 3, 4, 10, 16], "taken": [2, 5], "target": [5, 6, 7, 18], "target_spe": [6, 7, 18], "tax": 10, "team": [5, 17, 23], "team_reward": 17, "tensor": [9, 11, 17], "term": 5, "termin": [2, 3, 19], "terminate_on_fal": 15, "test": [19, 20, 22], "than": 11, "thei": [5, 9, 11, 17], "them": [2, 4, 5, 9, 11, 16, 19], "themselv": 5, "therefor": [10, 12], "thi": [1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 16, 17, 18, 19, 20, 22], "third": 9, "thomasini_2023": 5, "three": 9, "threepwoodi": 21, "through": [2, 3], "tile": [5, 17], "time": [1, 2, 5, 9, 10, 11, 16], "time_penalti": 16, "timestep": [6, 7, 8, 10, 12, 14, 18], "todo": [5, 19], "togeth": 12, "token": 11, "toll": 10, "toll_mod": 10, "tool": 23, "top": [4, 11], "total": 12, "tourist": 5, "toward": [6, 7, 15, 16, 18], "trade": 5, "train": 3, "trajectori": [4, 7, 18], "transform": 4, "travel": [5, 6, 7, 10, 15, 18], "true": [12, 15, 16, 17], "trunc_prob": 12, "truncat": [2, 3, 19], "try": [6, 9, 21], "tupl": [3, 8, 14], "turn": [5, 9, 11, 17], "two": [5, 8, 9, 10, 11, 16, 17], "txt": 1, "type": [2, 3, 4, 5, 8, 12, 14], "type_distribut": 8, "typic": [2, 3], "uint8": 16, "umutucak": 21, "unchang": 16, "under": 10, "undocu": 21, "uniform": [8, 21], "until": 11, "up": [9, 14, 16], "updat": 21, "upper": 12, "us": [2, 4, 8, 10, 11, 12, 16, 19, 20, 22], "usag": [19, 20], "usual": [9, 11, 17], "util": [2, 3, 19, 22, 23], "v0": 5, "valid": 4, "valu": [2, 3, 4, 6, 7, 8, 11, 12, 15, 16, 18, 19], "variabl": 2, "varianc": 4, "variant": [5, 9, 11, 17], "vec_reward": [2, 3, 19], "vector": [2, 4, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19, 22], "vectori": 4, "veri": [2, 19], "version": [5, 10, 21, 22], "vertic": [11, 17], "via": 8, "view": 3, "villag": 12, "visual": 21, "w": 12, "w_bonu": 12, "wa": [4, 6, 7, 10, 12, 16, 18], "wai": [5, 17], "walker_0": [2, 19], "walker_1": [2, 19], "walker_2": [2, 19], "walker_i": 15, "wall": 16, "wandb": 21, "we": [2, 19, 23], "webpag": 21, "websit": 19, "weight": [2, 3, 4, 19, 21], "well": [5, 19, 22], "were": 17, "what": 21, "when": [6, 7, 11, 16, 17, 18], "where": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18, 19], "whether": [9, 11, 14, 16, 17], "which": [2, 3, 5, 6, 7, 9, 11, 12, 15, 17, 18, 19, 22], "while": [3, 5, 6, 7, 10, 18], "whose": [4, 9, 11, 17], "width": [9, 11, 17], "win": [5, 9, 11], "window": [2, 3, 16], "without": [5, 11], "work": [19, 22], "worker": 12, "workflow": 21, "world": 5, "would": [2, 3, 19], "wrapper": [5, 21, 23], "x": [9, 11, 17], "x_0": [6, 7, 18], "x_1": [6, 7, 18], "x_n": [6, 7, 18], "x_targ": [6, 7, 18], "xyz": [6, 7, 18], "y": [9, 17], "y_0": [6, 7, 18], "y_1": [6, 7, 18], "y_n": [6, 7, 18], "y_targ": [6, 7, 18], "you": [2, 3, 19, 22], "your": [1, 2, 3, 19, 22], "z": 9, "z_0": [6, 7, 18], "z_1": [6, 7, 18], "z_n": [6, 7, 18], "z_targ": [6, 7, 18], "zero": [5, 9, 11, 17]}, "titles": ["404 - Page Not Found", "MOMAland documentation", "AEC", "Parallel", "Wrappers and Utils", "All Environments", "Catch", "Escort", "MO-Beach", "MO-Breakthrough", "MO-Congestion", "MO-Connect4", "MO-GemMining", "MO-Ingenious", "MO-ItemGathering", "MO-MultiwalkerStability", "MO-Pistonball", "MO-SameGame", "Surround", "API", "Install", "Release Notes", "Making a Custom Environment", "Learning algorithms"], "titleterms": {"0": 21, "1": 21, "2": 21, "404": 0, "Not": 0, "The": 0, "action": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18], "aec": [2, 4], "algorithm": 23, "all": 5, "api": 19, "argument": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18], "attribut": [2, 3], "beach": 8, "breakthrough": 9, "build": 1, "catch": 6, "cite": 19, "commit": 22, "congest": 10, "connect4": 11, "convers": 4, "could": 0, "credit": [6, 7, 10, 12, 16, 18], "custom": 22, "document": 1, "dummi": 21, "environ": [5, 22], "episod": [6, 7, 8, 10, 12, 14, 15, 16, 18], "escort": 7, "found": 0, "gemmin": 12, "histori": [9, 11, 17], "hook": 22, "ingeni": 13, "instal": [19, 20], "itemgath": 14, "learn": 23, "legal": [9, 11, 17], "make": 22, "mask": [9, 11, 17], "method": [2, 3], "mo": [8, 9, 10, 11, 12, 13, 14, 15, 16, 17], "moaecenv": 2, "momaland": 1, "moparallelenv": 3, "multiwalkerst": 15, "note": 21, "observ": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18], "page": 0, "parallel": [3, 4], "pistonbal": 16, "pre": 22, "releas": 21, "request": 0, "reward": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18], "samegam": 17, "setup": 22, "space": [6, 7, 8, 9, 10, 11, 12, 14, 15, 16, 17, 18], "start": [6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18], "state": [6, 7, 8, 9, 10, 11, 12, 14, 16, 17, 18], "surround": 18, "termin": [6, 7, 8, 10, 12, 14, 15, 16, 18], "truncat": [6, 7, 8, 10, 12, 14, 16, 18], "usag": [2, 3], "util": 4, "v0": 21, "version": [9, 11, 17], "wrapper": 4}}) \ No newline at end of file diff --git a/tutorials/custom_env/index.html b/tutorials/custom_env/index.html index 57810882..9ddc16ff 100644 --- a/tutorials/custom_env/index.html +++ b/tutorials/custom_env/index.html @@ -232,7 +232,6 @@
    • MO-GemMining
    • MO-Ingenious
    • MO-ItemGathering
    • -
    • MO-Multiwalker
    • MO-MultiwalkerStability
    • MO-Pistonball
    • MO-SameGame
    • @@ -422,7 +421,7 @@

      Setup pre-commit hooks + diff --git a/tutorials/learning_algorithms/index.html b/tutorials/learning_algorithms/index.html index 302cf7d1..635a831d 100644 --- a/tutorials/learning_algorithms/index.html +++ b/tutorials/learning_algorithms/index.html @@ -232,7 +232,6 @@
    • MO-GemMining
    • MO-Ingenious
    • MO-ItemGathering
    • -
    • MO-Multiwalker
    • MO-MultiwalkerStability
    • MO-Pistonball
    • MO-SameGame
    • @@ -334,6 +333,30 @@

      Learning algorithms

      Scalarized IQL

      +

      Single

      +

      Individual

      +

      Individual / Linear

      +

      Discrete

      +

      Discrete

      +

      + +

      Centralization wrapper

      +

      Any

      +

      Team

      +

      Team / Any

      +

      Discrete

      +

      Discrete

      +

      + +

      Linearization wrapper

      +

      Single

      +

      Any

      +

      Individual / Linear

      +

      Any

      +

      Any

      +

      +

    @@ -425,7 +448,7 @@

    Learning algorithms +