From 999b93c673c4a2518228f3e85ee5f7e16005802f Mon Sep 17 00:00:00 2001 From: ffelten Date: Mon, 4 Mar 2024 10:17:59 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/momaland@c5ffc3361444202bf7bbe7e8dfc99d2957bcf027=20?= =?UTF-8?q?=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .buildinfo | 2 +- environments/momultiwalker_stability/index.html | 15 ++++++++++----- searchindex.js | 2 +- 3 files changed, 12 insertions(+), 7 deletions(-) diff --git a/.buildinfo b/.buildinfo index 3a3c6581..b986b017 100644 --- a/.buildinfo +++ b/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 92f91e2f517770ebc017784489e6c06e +config: 479e3b211f8dbf0073d98f35c52899c9 tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/environments/momultiwalker_stability/index.html b/environments/momultiwalker_stability/index.html index 3f1972b4..aa9361b1 100644 --- a/environments/momultiwalker_stability/index.html +++ b/environments/momultiwalker_stability/index.html @@ -317,7 +317,7 @@

MO-MultiwalkerStability

Box(-inf, inf, (31,), float32)

Reward Space

-

Box([-2.100e+02 -1.567e-02], [0.46 0. ], (2,), float32)

+

Box([-2.100e+02 -1.567e-02], [-209.54 0. ], (2,), float32)

Import

momaland.envs.momultiwalker_stability_v0

@@ -337,14 +337,19 @@

Action Space

Reward Space#

-

The reward space is a 2D vector where; the first value contains the sum of following rewards:

+

The reward space is a 2D vector where; the first value contains the following reward:

  • Maximizing distance traveled towards the end of the level during one step. [-0.46, 0.46]

  • -
  • Penalty for agent falling. [-110, 0]

  • -
  • Penalty for the package falling. [-100, 0] -and the second value contains:

  • +
+

and the second value contains:

+
  • A penalty based on the change of angle of the package, to avoid shaking the package. [-0.01567, 0]

+

Both these objectives are penalized with:

+
    +
  • Penalty for agent falling. [-110, 0]

  • +
  • Penalty for the package falling. [-100, 0]

  • +

Episode Termination#

diff --git a/searchindex.js b/searchindex.js index 2561445d..c5f0002f 100644 --- a/searchindex.js +++ b/searchindex.js @@ -1 +1 @@ -Search.setIndex({"docnames": ["404", "README", "api/aec", "api/parallel", "api/wrappers", "environments/all-envs", "environments/catch", "environments/escort", "environments/mobeach", "environments/mobreakthrough", "environments/mocongestion", "environments/moconnect4", "environments/mogem_mining", "environments/moingenious", "environments/moitem_gathering", "environments/momultiwalker", "environments/momultiwalker_stability", "environments/mopistonball", "environments/mosame_game", "environments/surround", "index", "introduction/install", "release_notes", "tutorials/custom_env", "tutorials/learning_algorithms"], "filenames": ["404.md", "README.md", "api/aec.md", "api/parallel.md", "api/wrappers.md", "environments/all-envs.md", "environments/catch.md", "environments/escort.md", "environments/mobeach.md", "environments/mobreakthrough.md", "environments/mocongestion.md", "environments/moconnect4.md", "environments/mogem_mining.md", "environments/moingenious.md", "environments/moitem_gathering.md", "environments/momultiwalker.md", "environments/momultiwalker_stability.md", "environments/mopistonball.md", "environments/mosame_game.md", "environments/surround.md", "index.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "tutorials/learning_algorithms.md"], "titles": ["404 - Page Not Found", "MOMAland documentation", "AEC", "Parallel", "Wrappers and Utils", "All Environments", "Catch", "Escort", "MO-Beach", "MO-Breakthrough", "MO-Congestion", "MO-Connect4", "MO-GemMining", "MO-Ingenious", "MO-ItemGathering", "MO-Multiwalker", "MO-MultiwalkerStability", "MO-Pistonball", "MO-SameGame", "Surround", "API", "Install", "Release Notes", "Making a Custom Environment", "Learning algorithms"], "terms": {"thi": [1, 2, 3, 4, 6, 7, 19, 20, 21, 23], "folder": 1, "contain": [1, 2, 6, 7, 15, 16, 19, 24], "For": [1, 2, 3, 4, 20], "more": [1, 2, 3, 20], "inform": 1, "about": 1, "how": [1, 6, 7, 19], "contribut": 1, "go": 1, "our": [1, 23], "md": 1, "instal": [1, 23], "requir": [1, 20, 21], "packag": [1, 15, 16, 23], "your": [1, 2, 3, 20, 23], "fork": 1, "pip": [1, 20, 21, 23], "r": 1, "doc": 1, "txt": 1, "e": [1, 2, 3, 23], "To": [1, 20, 21, 24], "onc": 1, "cd": 1, "make": [1, 2, 20], "dirhtml": 1, "rebuild": 1, "automat": [1, 2], "everi": [1, 2, 3], "time": [1, 2], "chang": [1, 2, 3, 4, 8, 10, 12, 14, 16], "i": [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24], "made": 1, "sphinx": 1, "autobuild": 1, "b": 1, "_build": 1, "similar": [2, 4, 20], "pettingzoo": [2, 3, 5, 15, 16, 20, 23], "momaland": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24], "api": [2, 3, 4, 21], "model": [2, 20], "environ": [2, 3, 4, 6, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 24], "simpl": [2, 20], "python": [2, 20], "env": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23], "class": [2, 3, 4, 20, 23], "creat": [2, 20, 23], "instanc": [2, 4, 20], "interact": [2, 3, 20], "them": [2, 4, 20], "veri": [2, 20], "here": [2, 20, 24], "": [2, 3, 4, 6, 7, 19, 20, 24], "an": [2, 3, 4, 6, 7, 15, 19, 20, 23], "exampl": [2, 4, 6, 7, 19, 20, 23], "us": [2, 4, 20, 21, 23], "momultiwalker_v0": [2, 3, 15, 20], "from": [2, 3, 5, 6, 7, 16, 19, 20, 23, 24], "momultiwalk": [2, 3, 20], "import": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "_env": [2, 3, 20], "numpi": [2, 3, 20], "np": [2, 3, 4, 20], "function": [2, 3, 20, 23], "return": [2, 3, 20, 23], "per": [2, 3, 20], "pz": [2, 3, 4, 20, 23], "standard": [2, 3, 20], "render_mod": [2, 3, 6, 7, 19, 20], "human": [2, 3, 6, 7, 19, 20], "reset": [2, 3, 20], "seed": [2, 3, 20], "42": [2, 3, 20], "agent": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23], "agent_it": [2, 20], "vec_reward": [2, 3, 20], "arrai": [2, 3, 4, 6, 7, 19, 20], "observ": [2, 3, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 24], "termin": [2, 3, 20], "truncat": [2, 3, 20], "info": [2, 3, 20], "last": [2, 20], "action": [2, 3, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 24], "none": [2, 3, 6, 7, 19, 20], "els": [2, 20], "action_spac": [2, 3, 8, 10, 12, 14, 20], "sampl": [2, 3, 20], "where": [2, 3, 4, 6, 7, 16, 19, 20], "you": [2, 3, 20, 23], "would": [2, 3, 20], "insert": [2, 3, 20], "polici": [2, 3, 4, 20, 24], "step": [2, 3, 6, 7, 15, 16, 19, 20], "close": [2, 3, 20, 24], "option": [2, 3, 6, 7, 19, 20], "can": [2, 3, 4, 6, 7, 19, 20, 21], "scalar": [2, 3, 4, 20], "reward": [2, 3, 4, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 23, 24], "weight": [2, 3, 4, 20], "vector": [2, 4, 6, 7, 15, 16, 19, 20, 23], "shift": [2, 20], "singl": [2, 15, 16, 20, 24], "object": [2, 3, 4, 5, 9, 11, 13, 17, 18, 20, 24], "multi": [2, 3, 5, 9, 11, 13, 17, 20, 24], "aka": [2, 20], "we": [2, 20, 24], "assign": [2, 20], "differ": [2, 20], "each": [2, 3, 4, 6, 7, 19, 20, 23, 24], "walker_0": [2, 20], "0": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "1": [2, 4, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "7": [2, 11, 12, 20], "2": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20], "walker_1": [2, 20], "6": [2, 3, 11, 12, 13, 17, 20], "3": [2, 6, 7, 8, 10, 12, 14, 15, 17, 19, 20], "walker_2": [2, 20], "linearizereward": [2, 4, 20], "detail": [2, 3, 20], "rl": [2, 20], "definit": [2, 20], "see": [2, 3, 15, 16, 20, 21, 23], "decis": [2, 20], "A": [2, 3, 4, 6, 7, 16, 17, 19, 20], "util": [2, 3, 20, 23, 24], "base": [2, 3, 4, 16, 20], "analysi": [2, 20], "survei": [2, 20], "also": [2, 4, 20], "check": [2, 4, 20, 22, 23], "colab": [2, 20], "notebook": [2, 20], "extend": [2, 3, 23], "moaec": 2, "oppos": [2, 3], "ha": [2, 3, 4], "reward_spac": [2, 3, 4, 23], "member": [2, 3, 23], "document": [2, 3, 15, 16, 20, 21, 23], "sourc": [2, 3, 4, 6, 7, 19, 20], "overrid": [2, 3, 4, 23], "type": [2, 3, 4], "enforc": [2, 3], "list": [2, 3, 24], "agentid": [2, 3], "name": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 24], "all": [2, 3, 20, 21], "current": [2, 3, 24], "typic": [2, 3], "integ": [2, 3], "These": [2, 3, 8, 10, 12, 14], "mai": [2, 3], "progress": [2, 3], "ad": [2, 3], "remov": [2, 3], "num_ag": [2, 3], "The": [2, 3, 4, 6, 7, 8, 10, 12, 14, 15, 16, 19, 20, 24], "length": [2, 3, 6, 7, 19], "possible_ag": [2, 3, 4, 8, 10, 12, 14], "could": [2, 3], "gener": [2, 3], "equival": [2, 3], "space": [2, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 23, 24], "cannot": [2, 3], "through": [2, 3], "plai": [2, 3], "max_num_ag": [2, 3], "agent_select": 2, "correspond": 2, "select": 2, "taken": [2, 5], "dict": [2, 3, 4, 9, 11, 13, 18], "bool": [2, 3], "ndarrai": [2, 3], "ani": [2, 24], "dtype": 2, "_scalartype_co": 2, "call": 2, "kei": [2, 3, 4], "instantan": 2, "after": [2, 8, 10, 12, 14], "accumul": 2, "note": 2, "doe": [2, 20, 21], "directli": 2, "access": [2, 4], "rather": 2, "store": 2, "intern": 2, "variabl": 2, "structur": 2, "look": 2, "like": [2, 3, 4, 24], "first": [2, 16], "second": [2, 16], "n": 2, "nth": 2, "float": [2, 3, 4, 6, 7, 19], "str": [2, 3, 6, 7, 19], "observation_spac": [2, 3, 8, 10, 12, 14], "gymnasium": [2, 3], "actiontyp": [2, 3], "accept": 2, "execut": [2, 3], "switch": 2, "control": 2, "next": 2, "int": [2, 3, 6, 7, 19], "start": [2, 12, 14], "state": [2, 3], "obstyp": [2, 3], "render": [2, 3, 6, 7, 19], "specifi": [2, 23], "self": [2, 23, 24], "mode": [2, 3, 6, 7, 19], "displai": [2, 3, 6, 7, 19], "window": [2, 3], "other": [2, 6, 7, 19, 24], "default": [2, 3, 15, 16], "ar": [2, 3, 4, 6, 7, 19, 23, 24], "rgb_arrai": [2, 3], "which": [2, 3, 6, 7, 16, 19, 20, 23], "support": [2, 3], "outsid": [2, 3], "classic": [2, 3], "ansi": [2, 3], "string": [2, 3], "print": [2, 3, 4], "specif": [2, 3], "resourc": 2, "should": [2, 6, 7, 8, 10, 12, 14, 19, 23], "releas": 2, "subprocess": 2, "network": 2, "connect": [2, 11], "take": [2, 3, 4, 8, 10, 12, 14], "must": [2, 3, 4, 5], "same": [2, 3, 5], "valu": [2, 3, 4, 6, 7, 16, 19, 20], "implement": [2, 3, 24], "follow": [3, 6, 7, 8, 10, 12, 14, 16, 19, 20], "parallel_env": [3, 4, 23], "linearreward": 3, "while": [3, 5, 6, 7, 19], "In": 3, "etc": 3, "respect": 3, "data": 3, "so": [3, 4], "moparallel": 3, "gym": 3, "tupl": [3, 14], "receiv": 3, "dictionari": [3, 23], "And": 3, "frame": 3, "altern": 3, "global": 3, "view": 3, "appropri": 3, "central": 3, "train": 3, "decentr": 3, "qmix": 3, "transform": 4, "input": 4, "output": 4, "new": [4, 23], "some": [4, 20, 21], "valid": 4, "appli": 4, "between": [4, 5, 20], "nativ": 4, "On": 4, "top": 4, "few": 4, "split": 4, "own": 4, "modul": 4, "parallel_wrapp": 4, "mo_aec_to_parallel_wrapp": 4, "aec_env": 4, "convert": 4, "behavior": 4, "handl": 4, "vectori": 4, "keep": [4, 24], "inherit": 4, "avoid": [4, 6, 7, 16, 19], "code": [4, 6, 7, 19], "duplic": 4, "mo": [4, 5], "mo_parallel_to_aec_wrapp": 4, "aec_wrapp": 4, "repres": [4, 6, 7, 15, 16, 19], "agent_0": 4, "9": [4, 11, 12], "agent_1": 4, "8": [4, 9, 12, 14, 17], "linear": [4, 24], "initi": [4, 6, 7, 8, 10, 12, 14, 19, 23], "paramet": 4, "add": [4, 23], "normalizereward": 4, "idx": 4, "gamma": 4, "99": [4, 8], "epsilon": 4, "1e": 4, "08": 4, "normal": 4, "immedi": 4, "t": [4, 23], "exponenti": 4, "move": [4, 6, 7, 19], "averag": [4, 6, 7, 19], "fix": [4, 5], "varianc": 4, "have": [4, 20, 23], "scale": 4, "depend": [4, 20, 21], "past": 4, "trajectori": [4, 7, 19], "correctli": 4, "wa": [4, 6, 7, 19], "newli": 4, "instanti": 4, "recent": 4, "rang": 4, "shape": [4, 6, 7, 19, 23], "aecwrapp": 4, "whose": 4, "index": 4, "stabil": 4, "discount": 4, "factor": 4, "recordepisodestatist": 4, "record": 4, "episod": 4, "statist": 4, "end": [4, 15, 16], "includ": [5, 20, 21], "marl": 5, "literatur": 5, "well": [5, 20, 23], "version": [5, 17, 22, 23], "cooper": 5, "adversari": 5, "ob": 5, "descript": 5, "catch": 5, "v0": 5, "continu": [5, 6, 7, 15, 16, 19, 24], "distance_target": 5, "distance_other_dron": 5, "corner": 5, "target": [5, 6, 7, 19], "drone": [5, 6, 7, 19], "maintain": 5, "distanc": [5, 6, 7, 15, 16, 19], "themselv": 5, "escort": 5, "circl": 5, "around": 5, "mobil": 5, "its": 5, "destin": 5, "without": 5, "break": 5, "format": 5, "surround": [5, 6], "point": [5, 7, 19], "beach": 5, "discret": [5, 8, 9, 10, 11, 12, 13, 14, 18, 24], "todo": [5, 20], "breakthrough": 5, "congest": 5, "connect4": 5, "gem": 5, "mine": 5, "ingeni": 5, "item": 5, "gather": 5, "multiwalk": [5, 16], "pistonbal": 5, "game": [5, 13], "agent_i": [6, 7, 8, 10, 12, 13, 14, 18, 19], "box": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "float32": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "15": [6, 7, 12, 13, 18, 19], "10": [6, 7, 12, 19], "inf": [6, 7, 15, 16, 19], "catch_v0": 6, "parallel": [6, 7, 19, 21, 23], "learn": [6, 7, 19, 20, 21], "try": [6, 22], "escap": 6, "num_dron": [6, 7, 19], "xyz": [6, 7, 19], "coordin": [6, 7, 19, 20], "order": [6, 7, 19], "x_0": [6, 7, 19], "y_0": [6, 7, 19], "z_0": [6, 7, 19], "x_targ": [6, 7, 19], "y_targ": [6, 7, 19], "z_targ": [6, 7, 19], "x_1": [6, 7, 19], "y_1": [6, 7, 19], "z_1": [6, 7, 19], "x_n": [6, 7, 19], "y_n": [6, 7, 19], "z_n": [6, 7, 19], "3d": [6, 7, 15, 19], "speed": [6, 7, 19], "direct": [6, 7, 19], "2d": [6, 7, 16, 19], "minim": [6, 7, 19], "toward": [6, 7, 15, 16, 19], "maxim": [6, 7, 15, 16, 19], "collis": [6, 7, 19], "size": [6, 7, 19], "posit": [6, 7, 19], "5": [6, 7, 8, 12, 14, 18, 19], "one": [6, 7, 15, 16, 19], "condit": [6, 7, 19], "met": [6, 7, 19], "collid": [6, 7, 19], "ground": [6, 7, 19], "when": [6, 7, 19], "reach": [6, 7, 19], "200": [6, 7, 19], "area": [6, 7, 19], "side": [6, 7, 19], "amount": [6, 7, 19], "init_flying_po": [6, 7, 19], "nparrai": [6, 7, 19], "init_target_loc": [6, 7, 19], "target_spe": [6, 7, 19], "travel": [6, 7, 15, 16, 19], "timestep": [6, 7, 19], "adapt": [6, 7, 15, 16, 19], "felten": [6, 7, 19], "escort_v0": 7, "final_target_loc": [7, 19], "final": [7, 19], "num_intermediate_point": [7, 19], "number": [7, 19], "intermedi": [7, 19], "100": [8, 15, 16, 17], "18": [8, 12, 13], "73087": 8, "mobeach_v0": [8, 23], "beachdomain": 8, "problem": [8, 10, 14], "init": [8, 10, 12, 14], "method": [8, 10, 12, 14, 23], "argument": [8, 10, 12, 14], "defin": [8, 10, 12, 14, 23], "attribut": [8, 10, 12, 14], "player_i": [9, 11], "192": 9, "action_mask": [9, 11, 13, 18], "multibinari": 9, "int8": [9, 11, 13, 18], "4": [9, 12, 15, 16], "mobreakthrough_v0": 9, "4199": 10, "4200": 10, "mocongestion_v0": 10, "moconnect4_v0": 11, "four": 11, "19": [12, 17], "11": 12, "12": [12, 22], "13": 12, "14": 12, "16": 12, "17": 12, "20": [12, 22], "23": 12, "mogem_mining_v0": 12, "domain": 12, "5544": 13, "board": 13, "score": 13, "int32": 13, "tile": 13, "moingenious_v0": 13, "int64": 14, "moitem_gathering_v0": 14, "walker_i": [15, 16], "31": [15, 16], "46666667": 15, "110": [15, 16], "forc": [15, 16], "exert": [15, 16], "avail": [15, 16], "joint": [15, 16], "hip": [15, 16], "knee": [15, 16], "give": [15, 16], "element": [15, 16], "higher": [15, 16], "bound": [15, 16], "lower": [15, 16], "level": [15, 16], "dure": [15, 16], "46": [15, 16], "penalti": [15, 16], "fall": [15, 16], "drop": [15, 16], "If": [15, 16, 20], "terminate_on_fal": [15, 16], "true": [15, 16], "even": [15, 16], "still": [15, 16], "aliv": [15, 16], "100e": 16, "02": 16, "567e": 16, "momultiwalker_stability_v0": 16, "sister": 16, "sum": 16, "angl": 16, "shake": 16, "01567": 16, "piston_i": 17, "255": 17, "457": 17, "120": 17, "uint8": 17, "79e": 17, "04": 17, "00e": 17, "01": 17, "60": 17, "mopistonball_v0": 17, "225": 18, "50625": 18, "mosame_game_v0": 18, "multipl": 18, "surround_v0": 19, "static": 19, "reinforc": 20, "momarl": 20, "open": 20, "librari": [20, 24], "develop": 20, "compar": 20, "algorithm": [20, 21], "provid": [20, 24], "commun": 20, "set": [20, 24], "compliant": 20, "essenti": 20, "instead": [20, 23], "websit": 20, "public": 20, "discord": 20, "server": 20, "work": [20, 23], "join": 20, "aec": [20, 21, 23], "compon": [20, 21], "everyth": [20, 21, 23, 24], "basic": [20, 21], "usag": [20, 21], "problemat": [20, 21], "certain": [20, 21], "system": [20, 21], "test": [20, 21, 23], "suppli": [20, 21], "repositori": [20, 23], "research": 20, "pleas": 20, "inproceed": 20, "guid": 21, "2023": 22, "github": 22, "pypi": 22, "bump": 22, "workflow": 22, "don": 23, "env_nam": 23, "py": 23, "moparallelenv": 23, "moaecenv": 23, "addition": 23, "given": 23, "factori": 23, "raw_env": 23, "pure": 23, "constructor": 23, "practic": 23, "convers": 23, "insid": 23, "g": 23, "mo_parallel_to_aec": 23, "parallel_to_aec": 23, "directori": [23, 24], "export": 23, "all_modul": 23, "run": 23, "pytest": 23, "compat": 24, "possibl": 24, "file": 24, "cleanrl": 24, "philosophi": 24, "nevertheless": 24, "reus": 24, "tool": 24, "evalu": 24, "perform": 24, "indic": 24, "morl": 24, "baselin": 24, "paper": 24, "momappo": 24, "ol": 24, "team": 24}, "objects": {"momaland.utils.aec_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"]], "momaland.utils.conversions": [[4, 0, 1, "", "mo_aec_to_parallel_wrapper"], [4, 0, 1, "", "mo_parallel_to_aec_wrapper"]], "momaland.utils.env": [[2, 0, 1, "", "MOAECEnv"], [3, 0, 1, "", "MOParallelEnv"]], "momaland.utils.env.MOAECEnv": [[2, 1, 1, "", "action_space"], [2, 2, 1, "", "action_spaces"], [2, 2, 1, "", "agent_selection"], [2, 2, 1, "", "agents"], [2, 1, 1, "", "close"], [2, 2, 1, "", "infos"], [2, 2, 1, "", "max_num_agents"], [2, 2, 1, "", "num_agents"], [2, 1, 1, "", "observation_space"], [2, 2, 1, "", "observation_spaces"], [2, 1, 1, "", "observe"], [2, 2, 1, "", "possible_agents"], [2, 1, 1, "", "render"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "reward_space"], [2, 2, 1, "", "reward_spaces"], [2, 2, 1, "", "rewards"], [2, 1, 1, "", "step"], [2, 2, 1, "", "terminations"], [2, 2, 1, "", "truncations"]], "momaland.utils.env.MOParallelEnv": [[3, 1, 1, "", "action_space"], [3, 2, 1, "", "action_spaces"], [3, 2, 1, "", "agents"], [3, 1, 1, "", "close"], [3, 2, 1, "", "max_num_agents"], [3, 2, 1, "", "num_agents"], [3, 1, 1, "", "observation_space"], [3, 2, 1, "", "observation_spaces"], [3, 2, 1, "", "possible_agents"], [3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "reward_space"], [3, 2, 1, "", "reward_spaces"], [3, 1, 1, "", "state"], [3, 1, 1, "", "step"]], "momaland.utils.parallel_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"], [4, 0, 1, "", "RecordEpisodeStatistics"]]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute"}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"]}, "titleterms": {"404": 0, "page": 0, "Not": 0, "found": 0, "The": 0, "request": 0, "could": 0, "momaland": 1, "document": 1, "build": 1, "aec": [2, 4], "usag": [2, 3], "moaecenv": 2, "attribut": [2, 3], "method": [2, 3], "parallel": [3, 4], "moparallelenv": 3, "wrapper": 4, "util": 4, "convers": 4, "all": 5, "environ": [5, 23], "catch": 6, "observ": [6, 7, 15, 16, 19], "space": [6, 7, 15, 16, 19], "action": [6, 7, 15, 16, 19], "reward": [6, 7, 15, 16, 19], "start": [6, 7, 19], "state": [6, 7, 19], "episod": [6, 7, 15, 16, 19], "termin": [6, 7, 15, 16, 19], "truncat": [6, 7, 19], "argument": [6, 7, 15, 16, 19], "credit": [6, 7, 19], "escort": 7, "mo": [8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18], "beach": 8, "breakthrough": 9, "congest": 10, "connect4": 11, "gemmin": 12, "ingeni": 13, "itemgath": 14, "multiwalk": 15, "multiwalkerst": 16, "pistonbal": 17, "samegam": 18, "surround": 19, "api": 20, "instal": [20, 21], "cite": 20, "releas": 22, "note": 22, "v0": 22, "0": 22, "2": 22, "dummi": 22, "1": 22, "make": 23, "custom": 23, "setup": 23, "pre": 23, "commit": 23, "hook": 23, "learn": 24, "algorithm": 24}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "MOMAland documentation": [[1, "momaland-documentation"]], "Build the Documentation": [[1, "build-the-documentation"]], "AEC": [[2, "aec"], [4, "aec"]], "Usage": [[2, "usage"], [3, "usage"]], "MOAECEnv": [[2, "moaecenv"]], "Attributes": [[2, "attributes"], [3, "attributes"]], "Methods": [[2, "methods"], [3, "methods"]], "Parallel": [[3, "parallel"], [4, "parallel"]], "MOParallelEnv": [[3, "moparallelenv"]], "Wrappers and Utils": [[4, "wrappers-and-utils"]], "Conversion": [[4, "conversion"]], "AEC to Parallel": [[4, "aec-to-parallel"]], "Parallel to AEC": [[4, "parallel-to-aec"]], "All Environments": [[5, "all-environments"]], "Catch": [[6, "catch"]], "Observation Space": [[6, "observation-space"], [7, "observation-space"], [15, "observation-space"], [16, "observation-space"], [19, "observation-space"]], "Action Space": [[6, "action-space"], [7, "action-space"], [15, "action-space"], [16, "action-space"], [19, "action-space"]], "Reward Space": [[6, "reward-space"], [7, "reward-space"], [15, "reward-space"], [16, "reward-space"], [19, "reward-space"]], "Starting State": [[6, "starting-state"], [7, "starting-state"], [19, "starting-state"]], "Episode Termination": [[6, "episode-termination"], [7, "episode-termination"], [15, "episode-termination"], [16, "episode-termination"], [19, "episode-termination"]], "Episode Truncation": [[6, "episode-truncation"], [7, "episode-truncation"], [19, "episode-truncation"]], "Arguments": [[6, "arguments"], [7, "arguments"], [15, "arguments"], [16, "arguments"], [19, "arguments"]], "Credits": [[6, "credits"], [7, "credits"], [19, "credits"]], "Escort": [[7, "escort"]], "MO-Beach": [[8, "mo-beach"]], "MO-Breakthrough": [[9, "mo-breakthrough"]], "MO-Congestion": [[10, "mo-congestion"]], "MO-Connect4": [[11, "mo-connect4"]], "MO-GemMining": [[12, "mo-gemmining"]], "MO-Ingenious": [[13, "mo-ingenious"]], "MO-ItemGathering": [[14, "mo-itemgathering"]], "MO-Multiwalker": [[15, "mo-multiwalker"]], "MO-MultiwalkerStability": [[16, "mo-multiwalkerstability"]], "MO-Pistonball": [[17, "mo-pistonball"]], "MO-SameGame": [[18, "mo-samegame"]], "Surround": [[19, "surround"]], "API": [[20, "api"]], "Install": [[20, "install"], [21, "install"]], "Citing": [[20, "citing"]], "Release Notes": [[22, "release-notes"]], "v0.0.2: Dummy release 2": [[22, "release-v0-0-2"]], "v0.0.1: Dummy release": [[22, "release-v0-0-1"]], "Making a Custom Environment": [[23, "making-a-custom-environment"]], "Setup pre-commit hooks": [[23, "setup-pre-commit-hooks"]], "Learning algorithms": [[24, "learning-algorithms"]]}, "indexentries": {"moaecenv (class in momaland.utils.env)": [[2, "momaland.utils.env.MOAECEnv"]], "action_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.action_space"]], "action_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.action_spaces"]], "agent_selection (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agent_selection"]], "agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agents"]], "close() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.close"]], "infos (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.infos"]], "max_num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.max_num_agents"]], "num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.num_agents"]], "observation_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observation_space"]], "observation_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.observation_spaces"]], "observe() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observe"]], "possible_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.possible_agents"]], "render() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.render"]], "reset() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reset"]], "reward_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reward_space"]], "reward_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.reward_spaces"]], "rewards (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.rewards"]], "step() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.step"]], "terminations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.terminations"]], "truncations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.truncations"]], "moparallelenv (class in momaland.utils.env)": [[3, "momaland.utils.env.MOParallelEnv"]], "action_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.action_space"]], "action_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.action_spaces"]], "agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.agents"]], "close() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.close"]], "max_num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.max_num_agents"]], "num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.num_agents"]], "observation_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.observation_space"]], "observation_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.observation_spaces"]], "possible_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.possible_agents"]], "render() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.render"]], "reset() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reset"]], "reward_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reward_space"]], "reward_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.reward_spaces"]], "state() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.state"]], "step() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.step"]], "linearizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.LinearizeReward"]], "linearizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.LinearizeReward"]], "normalizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.NormalizeReward"]], "normalizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.NormalizeReward"]], "recordepisodestatistics (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.RecordEpisodeStatistics"]], "mo_aec_to_parallel_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_aec_to_parallel_wrapper"]], "mo_parallel_to_aec_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_parallel_to_aec_wrapper"]]}}) \ No newline at end of file +Search.setIndex({"docnames": ["404", "README", "api/aec", "api/parallel", "api/wrappers", "environments/all-envs", "environments/catch", "environments/escort", "environments/mobeach", "environments/mobreakthrough", "environments/mocongestion", "environments/moconnect4", "environments/mogem_mining", "environments/moingenious", "environments/moitem_gathering", "environments/momultiwalker", "environments/momultiwalker_stability", "environments/mopistonball", "environments/mosame_game", "environments/surround", "index", "introduction/install", "release_notes", "tutorials/custom_env", "tutorials/learning_algorithms"], "filenames": ["404.md", "README.md", "api/aec.md", "api/parallel.md", "api/wrappers.md", "environments/all-envs.md", "environments/catch.md", "environments/escort.md", "environments/mobeach.md", "environments/mobreakthrough.md", "environments/mocongestion.md", "environments/moconnect4.md", "environments/mogem_mining.md", "environments/moingenious.md", "environments/moitem_gathering.md", "environments/momultiwalker.md", "environments/momultiwalker_stability.md", "environments/mopistonball.md", "environments/mosame_game.md", "environments/surround.md", "index.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "tutorials/learning_algorithms.md"], "titles": ["404 - Page Not Found", "MOMAland documentation", "AEC", "Parallel", "Wrappers and Utils", "All Environments", "Catch", "Escort", "MO-Beach", "MO-Breakthrough", "MO-Congestion", "MO-Connect4", "MO-GemMining", "MO-Ingenious", "MO-ItemGathering", "MO-Multiwalker", "MO-MultiwalkerStability", "MO-Pistonball", "MO-SameGame", "Surround", "API", "Install", "Release Notes", "Making a Custom Environment", "Learning algorithms"], "terms": {"thi": [1, 2, 3, 4, 6, 7, 19, 20, 21, 23], "folder": 1, "contain": [1, 2, 6, 7, 15, 16, 19, 24], "For": [1, 2, 3, 4, 20], "more": [1, 2, 3, 20], "inform": 1, "about": 1, "how": [1, 6, 7, 19], "contribut": 1, "go": 1, "our": [1, 23], "md": 1, "instal": [1, 23], "requir": [1, 20, 21], "packag": [1, 15, 16, 23], "your": [1, 2, 3, 20, 23], "fork": 1, "pip": [1, 20, 21, 23], "r": 1, "doc": 1, "txt": 1, "e": [1, 2, 3, 23], "To": [1, 20, 21, 24], "onc": 1, "cd": 1, "make": [1, 2, 20], "dirhtml": 1, "rebuild": 1, "automat": [1, 2], "everi": [1, 2, 3], "time": [1, 2], "chang": [1, 2, 3, 4, 8, 10, 12, 14, 16], "i": [1, 2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24], "made": 1, "sphinx": 1, "autobuild": 1, "b": 1, "_build": 1, "similar": [2, 4, 20], "pettingzoo": [2, 3, 5, 15, 16, 20, 23], "momaland": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24], "api": [2, 3, 4, 21], "model": [2, 20], "environ": [2, 3, 4, 6, 7, 8, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 24], "simpl": [2, 20], "python": [2, 20], "env": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23], "class": [2, 3, 4, 20, 23], "creat": [2, 20, 23], "instanc": [2, 4, 20], "interact": [2, 3, 20], "them": [2, 4, 20], "veri": [2, 20], "here": [2, 20, 24], "": [2, 3, 4, 6, 7, 19, 20, 24], "an": [2, 3, 4, 6, 7, 15, 19, 20, 23], "exampl": [2, 4, 6, 7, 19, 20, 23], "us": [2, 4, 20, 21, 23], "momultiwalker_v0": [2, 3, 15, 20], "from": [2, 3, 5, 6, 7, 16, 19, 20, 23, 24], "momultiwalk": [2, 3, 20], "import": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "_env": [2, 3, 20], "numpi": [2, 3, 20], "np": [2, 3, 4, 20], "function": [2, 3, 20, 23], "return": [2, 3, 20, 23], "per": [2, 3, 20], "pz": [2, 3, 4, 20, 23], "standard": [2, 3, 20], "render_mod": [2, 3, 6, 7, 19, 20], "human": [2, 3, 6, 7, 19, 20], "reset": [2, 3, 20], "seed": [2, 3, 20], "42": [2, 3, 20], "agent": [2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 23], "agent_it": [2, 20], "vec_reward": [2, 3, 20], "arrai": [2, 3, 4, 6, 7, 19, 20], "observ": [2, 3, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 24], "termin": [2, 3, 20], "truncat": [2, 3, 20], "info": [2, 3, 20], "last": [2, 20], "action": [2, 3, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 24], "none": [2, 3, 6, 7, 19, 20], "els": [2, 20], "action_spac": [2, 3, 8, 10, 12, 14, 20], "sampl": [2, 3, 20], "where": [2, 3, 4, 6, 7, 16, 19, 20], "you": [2, 3, 20, 23], "would": [2, 3, 20], "insert": [2, 3, 20], "polici": [2, 3, 4, 20, 24], "step": [2, 3, 6, 7, 15, 16, 19, 20], "close": [2, 3, 20, 24], "option": [2, 3, 6, 7, 19, 20], "can": [2, 3, 4, 6, 7, 19, 20, 21], "scalar": [2, 3, 4, 20], "reward": [2, 3, 4, 8, 9, 10, 11, 12, 13, 14, 17, 18, 20, 23, 24], "weight": [2, 3, 4, 20], "vector": [2, 4, 6, 7, 15, 16, 19, 20, 23], "shift": [2, 20], "singl": [2, 15, 16, 20, 24], "object": [2, 3, 4, 5, 9, 11, 13, 16, 17, 18, 20, 24], "multi": [2, 3, 5, 9, 11, 13, 17, 20, 24], "aka": [2, 20], "we": [2, 20, 24], "assign": [2, 20], "differ": [2, 20], "each": [2, 3, 4, 6, 7, 19, 20, 23, 24], "walker_0": [2, 20], "0": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "1": [2, 4, 6, 7, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20], "7": [2, 11, 12, 20], "2": [2, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 19, 20], "walker_1": [2, 20], "6": [2, 3, 11, 12, 13, 17, 20], "3": [2, 6, 7, 8, 10, 12, 14, 15, 17, 19, 20], "walker_2": [2, 20], "linearizereward": [2, 4, 20], "detail": [2, 3, 20], "rl": [2, 20], "definit": [2, 20], "see": [2, 3, 15, 16, 20, 21, 23], "decis": [2, 20], "A": [2, 3, 4, 6, 7, 16, 17, 19, 20], "util": [2, 3, 20, 23, 24], "base": [2, 3, 4, 16, 20], "analysi": [2, 20], "survei": [2, 20], "also": [2, 4, 20], "check": [2, 4, 20, 22, 23], "colab": [2, 20], "notebook": [2, 20], "extend": [2, 3, 23], "moaec": 2, "oppos": [2, 3], "ha": [2, 3, 4], "reward_spac": [2, 3, 4, 23], "member": [2, 3, 23], "document": [2, 3, 15, 16, 20, 21, 23], "sourc": [2, 3, 4, 6, 7, 19, 20], "overrid": [2, 3, 4, 23], "type": [2, 3, 4], "enforc": [2, 3], "list": [2, 3, 24], "agentid": [2, 3], "name": [2, 3, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 24], "all": [2, 3, 20, 21], "current": [2, 3, 24], "typic": [2, 3], "integ": [2, 3], "These": [2, 3, 8, 10, 12, 14], "mai": [2, 3], "progress": [2, 3], "ad": [2, 3], "remov": [2, 3], "num_ag": [2, 3], "The": [2, 3, 4, 6, 7, 8, 10, 12, 14, 15, 16, 19, 20, 24], "length": [2, 3, 6, 7, 19], "possible_ag": [2, 3, 4, 8, 10, 12, 14], "could": [2, 3], "gener": [2, 3], "equival": [2, 3], "space": [2, 3, 4, 5, 8, 9, 10, 11, 12, 13, 14, 17, 18, 23, 24], "cannot": [2, 3], "through": [2, 3], "plai": [2, 3], "max_num_ag": [2, 3], "agent_select": 2, "correspond": 2, "select": 2, "taken": [2, 5], "dict": [2, 3, 4, 9, 11, 13, 18], "bool": [2, 3], "ndarrai": [2, 3], "ani": [2, 24], "dtype": 2, "_scalartype_co": 2, "call": 2, "kei": [2, 3, 4], "instantan": 2, "after": [2, 8, 10, 12, 14], "accumul": 2, "note": 2, "doe": [2, 20, 21], "directli": 2, "access": [2, 4], "rather": 2, "store": 2, "intern": 2, "variabl": 2, "structur": 2, "look": 2, "like": [2, 3, 4, 24], "first": [2, 16], "second": [2, 16], "n": 2, "nth": 2, "float": [2, 3, 4, 6, 7, 19], "str": [2, 3, 6, 7, 19], "observation_spac": [2, 3, 8, 10, 12, 14], "gymnasium": [2, 3], "actiontyp": [2, 3], "accept": 2, "execut": [2, 3], "switch": 2, "control": 2, "next": 2, "int": [2, 3, 6, 7, 19], "start": [2, 12, 14], "state": [2, 3], "obstyp": [2, 3], "render": [2, 3, 6, 7, 19], "specifi": [2, 23], "self": [2, 23, 24], "mode": [2, 3, 6, 7, 19], "displai": [2, 3, 6, 7, 19], "window": [2, 3], "other": [2, 6, 7, 19, 24], "default": [2, 3, 15, 16], "ar": [2, 3, 4, 6, 7, 16, 19, 23, 24], "rgb_arrai": [2, 3], "which": [2, 3, 6, 7, 16, 19, 20, 23], "support": [2, 3], "outsid": [2, 3], "classic": [2, 3], "ansi": [2, 3], "string": [2, 3], "print": [2, 3, 4], "specif": [2, 3], "resourc": 2, "should": [2, 6, 7, 8, 10, 12, 14, 19, 23], "releas": 2, "subprocess": 2, "network": 2, "connect": [2, 11], "take": [2, 3, 4, 8, 10, 12, 14], "must": [2, 3, 4, 5], "same": [2, 3, 5], "valu": [2, 3, 4, 6, 7, 16, 19, 20], "implement": [2, 3, 24], "follow": [3, 6, 7, 8, 10, 12, 14, 16, 19, 20], "parallel_env": [3, 4, 23], "linearreward": 3, "while": [3, 5, 6, 7, 19], "In": 3, "etc": 3, "respect": 3, "data": 3, "so": [3, 4], "moparallel": 3, "gym": 3, "tupl": [3, 14], "receiv": 3, "dictionari": [3, 23], "And": 3, "frame": 3, "altern": 3, "global": 3, "view": 3, "appropri": 3, "central": 3, "train": 3, "decentr": 3, "qmix": 3, "transform": 4, "input": 4, "output": 4, "new": [4, 23], "some": [4, 20, 21], "valid": 4, "appli": 4, "between": [4, 5, 20], "nativ": 4, "On": 4, "top": 4, "few": 4, "split": 4, "own": 4, "modul": 4, "parallel_wrapp": 4, "mo_aec_to_parallel_wrapp": 4, "aec_env": 4, "convert": 4, "behavior": 4, "handl": 4, "vectori": 4, "keep": [4, 24], "inherit": 4, "avoid": [4, 6, 7, 16, 19], "code": [4, 6, 7, 19], "duplic": 4, "mo": [4, 5], "mo_parallel_to_aec_wrapp": 4, "aec_wrapp": 4, "repres": [4, 6, 7, 15, 16, 19], "agent_0": 4, "9": [4, 11, 12], "agent_1": 4, "8": [4, 9, 12, 14, 17], "linear": [4, 24], "initi": [4, 6, 7, 8, 10, 12, 14, 19, 23], "paramet": 4, "add": [4, 23], "normalizereward": 4, "idx": 4, "gamma": 4, "99": [4, 8], "epsilon": 4, "1e": 4, "08": 4, "normal": 4, "immedi": 4, "t": [4, 23], "exponenti": 4, "move": [4, 6, 7, 19], "averag": [4, 6, 7, 19], "fix": [4, 5], "varianc": 4, "have": [4, 20, 23], "scale": 4, "depend": [4, 20, 21], "past": 4, "trajectori": [4, 7, 19], "correctli": 4, "wa": [4, 6, 7, 19], "newli": 4, "instanti": 4, "recent": 4, "rang": 4, "shape": [4, 6, 7, 19, 23], "aecwrapp": 4, "whose": 4, "index": 4, "stabil": 4, "discount": 4, "factor": 4, "recordepisodestatist": 4, "record": 4, "episod": 4, "statist": 4, "end": [4, 15, 16], "includ": [5, 20, 21], "marl": 5, "literatur": 5, "well": [5, 20, 23], "version": [5, 17, 22, 23], "cooper": 5, "adversari": 5, "ob": 5, "descript": 5, "catch": 5, "v0": 5, "continu": [5, 6, 7, 15, 16, 19, 24], "distance_target": 5, "distance_other_dron": 5, "corner": 5, "target": [5, 6, 7, 19], "drone": [5, 6, 7, 19], "maintain": 5, "distanc": [5, 6, 7, 15, 16, 19], "themselv": 5, "escort": 5, "circl": 5, "around": 5, "mobil": 5, "its": 5, "destin": 5, "without": 5, "break": 5, "format": 5, "surround": [5, 6], "point": [5, 7, 19], "beach": 5, "discret": [5, 8, 9, 10, 11, 12, 13, 14, 18, 24], "todo": [5, 20], "breakthrough": 5, "congest": 5, "connect4": 5, "gem": 5, "mine": 5, "ingeni": 5, "item": 5, "gather": 5, "multiwalk": [5, 16], "pistonbal": 5, "game": [5, 13], "agent_i": [6, 7, 8, 10, 12, 13, 14, 18, 19], "box": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "float32": [6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19], "15": [6, 7, 12, 13, 18, 19], "10": [6, 7, 12, 19], "inf": [6, 7, 15, 16, 19], "catch_v0": 6, "parallel": [6, 7, 19, 21, 23], "learn": [6, 7, 19, 20, 21], "try": [6, 22], "escap": 6, "num_dron": [6, 7, 19], "xyz": [6, 7, 19], "coordin": [6, 7, 19, 20], "order": [6, 7, 19], "x_0": [6, 7, 19], "y_0": [6, 7, 19], "z_0": [6, 7, 19], "x_targ": [6, 7, 19], "y_targ": [6, 7, 19], "z_targ": [6, 7, 19], "x_1": [6, 7, 19], "y_1": [6, 7, 19], "z_1": [6, 7, 19], "x_n": [6, 7, 19], "y_n": [6, 7, 19], "z_n": [6, 7, 19], "3d": [6, 7, 15, 19], "speed": [6, 7, 19], "direct": [6, 7, 19], "2d": [6, 7, 16, 19], "minim": [6, 7, 19], "toward": [6, 7, 15, 16, 19], "maxim": [6, 7, 15, 16, 19], "collis": [6, 7, 19], "size": [6, 7, 19], "posit": [6, 7, 19], "5": [6, 7, 8, 12, 14, 18, 19], "one": [6, 7, 15, 16, 19], "condit": [6, 7, 19], "met": [6, 7, 19], "collid": [6, 7, 19], "ground": [6, 7, 19], "when": [6, 7, 19], "reach": [6, 7, 19], "200": [6, 7, 19], "area": [6, 7, 19], "side": [6, 7, 19], "amount": [6, 7, 19], "init_flying_po": [6, 7, 19], "nparrai": [6, 7, 19], "init_target_loc": [6, 7, 19], "target_spe": [6, 7, 19], "travel": [6, 7, 15, 16, 19], "timestep": [6, 7, 19], "adapt": [6, 7, 15, 16, 19], "felten": [6, 7, 19], "escort_v0": 7, "final_target_loc": [7, 19], "final": [7, 19], "num_intermediate_point": [7, 19], "number": [7, 19], "intermedi": [7, 19], "100": [8, 15, 16, 17], "18": [8, 12, 13], "73087": 8, "mobeach_v0": [8, 23], "beachdomain": 8, "problem": [8, 10, 14], "init": [8, 10, 12, 14], "method": [8, 10, 12, 14, 23], "argument": [8, 10, 12, 14], "defin": [8, 10, 12, 14, 23], "attribut": [8, 10, 12, 14], "player_i": [9, 11], "192": 9, "action_mask": [9, 11, 13, 18], "multibinari": 9, "int8": [9, 11, 13, 18], "4": [9, 12, 15, 16], "mobreakthrough_v0": 9, "4199": 10, "4200": 10, "mocongestion_v0": 10, "moconnect4_v0": 11, "four": 11, "19": [12, 17], "11": 12, "12": [12, 22], "13": 12, "14": 12, "16": 12, "17": 12, "20": [12, 22], "23": 12, "mogem_mining_v0": 12, "domain": 12, "5544": 13, "board": 13, "score": 13, "int32": 13, "tile": 13, "moingenious_v0": 13, "int64": 14, "moitem_gathering_v0": 14, "walker_i": [15, 16], "31": [15, 16], "46666667": 15, "110": [15, 16], "forc": [15, 16], "exert": [15, 16], "avail": [15, 16], "joint": [15, 16], "hip": [15, 16], "knee": [15, 16], "give": [15, 16], "element": [15, 16], "higher": [15, 16], "bound": [15, 16], "lower": [15, 16], "level": [15, 16], "dure": [15, 16], "46": [15, 16], "penalti": [15, 16], "fall": [15, 16], "drop": [15, 16], "If": [15, 16, 20], "terminate_on_fal": [15, 16], "true": [15, 16], "even": [15, 16], "still": [15, 16], "aliv": [15, 16], "100e": 16, "02": 16, "567e": 16, "209": 16, "54": 16, "momultiwalker_stability_v0": 16, "sister": 16, "angl": 16, "shake": 16, "01567": 16, "both": 16, "penal": 16, "piston_i": 17, "255": 17, "457": 17, "120": 17, "uint8": 17, "79e": 17, "04": 17, "00e": 17, "01": 17, "60": 17, "mopistonball_v0": 17, "225": 18, "50625": 18, "mosame_game_v0": 18, "multipl": 18, "surround_v0": 19, "static": 19, "reinforc": 20, "momarl": 20, "open": 20, "librari": [20, 24], "develop": 20, "compar": 20, "algorithm": [20, 21], "provid": [20, 24], "commun": 20, "set": [20, 24], "compliant": 20, "essenti": 20, "instead": [20, 23], "websit": 20, "public": 20, "discord": 20, "server": 20, "work": [20, 23], "join": 20, "aec": [20, 21, 23], "compon": [20, 21], "everyth": [20, 21, 23, 24], "basic": [20, 21], "usag": [20, 21], "problemat": [20, 21], "certain": [20, 21], "system": [20, 21], "test": [20, 21, 23], "suppli": [20, 21], "repositori": [20, 23], "research": 20, "pleas": 20, "inproceed": 20, "guid": 21, "2023": 22, "github": 22, "pypi": 22, "bump": 22, "workflow": 22, "don": 23, "env_nam": 23, "py": 23, "moparallelenv": 23, "moaecenv": 23, "addition": 23, "given": 23, "factori": 23, "raw_env": 23, "pure": 23, "constructor": 23, "practic": 23, "convers": 23, "insid": 23, "g": 23, "mo_parallel_to_aec": 23, "parallel_to_aec": 23, "directori": [23, 24], "export": 23, "all_modul": 23, "run": 23, "pytest": 23, "compat": 24, "possibl": 24, "file": 24, "cleanrl": 24, "philosophi": 24, "nevertheless": 24, "reus": 24, "tool": 24, "evalu": 24, "perform": 24, "indic": 24, "morl": 24, "baselin": 24, "paper": 24, "momappo": 24, "ol": 24, "team": 24}, "objects": {"momaland.utils.aec_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"]], "momaland.utils.conversions": [[4, 0, 1, "", "mo_aec_to_parallel_wrapper"], [4, 0, 1, "", "mo_parallel_to_aec_wrapper"]], "momaland.utils.env": [[2, 0, 1, "", "MOAECEnv"], [3, 0, 1, "", "MOParallelEnv"]], "momaland.utils.env.MOAECEnv": [[2, 1, 1, "", "action_space"], [2, 2, 1, "", "action_spaces"], [2, 2, 1, "", "agent_selection"], [2, 2, 1, "", "agents"], [2, 1, 1, "", "close"], [2, 2, 1, "", "infos"], [2, 2, 1, "", "max_num_agents"], [2, 2, 1, "", "num_agents"], [2, 1, 1, "", "observation_space"], [2, 2, 1, "", "observation_spaces"], [2, 1, 1, "", "observe"], [2, 2, 1, "", "possible_agents"], [2, 1, 1, "", "render"], [2, 1, 1, "", "reset"], [2, 1, 1, "", "reward_space"], [2, 2, 1, "", "reward_spaces"], [2, 2, 1, "", "rewards"], [2, 1, 1, "", "step"], [2, 2, 1, "", "terminations"], [2, 2, 1, "", "truncations"]], "momaland.utils.env.MOParallelEnv": [[3, 1, 1, "", "action_space"], [3, 2, 1, "", "action_spaces"], [3, 2, 1, "", "agents"], [3, 1, 1, "", "close"], [3, 2, 1, "", "max_num_agents"], [3, 2, 1, "", "num_agents"], [3, 1, 1, "", "observation_space"], [3, 2, 1, "", "observation_spaces"], [3, 2, 1, "", "possible_agents"], [3, 1, 1, "", "render"], [3, 1, 1, "", "reset"], [3, 1, 1, "", "reward_space"], [3, 2, 1, "", "reward_spaces"], [3, 1, 1, "", "state"], [3, 1, 1, "", "step"]], "momaland.utils.parallel_wrappers": [[4, 0, 1, "", "LinearizeReward"], [4, 0, 1, "", "NormalizeReward"], [4, 0, 1, "", "RecordEpisodeStatistics"]]}, "objtypes": {"0": "py:class", "1": "py:method", "2": "py:attribute"}, "objnames": {"0": ["py", "class", "Python class"], "1": ["py", "method", "Python method"], "2": ["py", "attribute", "Python attribute"]}, "titleterms": {"404": 0, "page": 0, "Not": 0, "found": 0, "The": 0, "request": 0, "could": 0, "momaland": 1, "document": 1, "build": 1, "aec": [2, 4], "usag": [2, 3], "moaecenv": 2, "attribut": [2, 3], "method": [2, 3], "parallel": [3, 4], "moparallelenv": 3, "wrapper": 4, "util": 4, "convers": 4, "all": 5, "environ": [5, 23], "catch": 6, "observ": [6, 7, 15, 16, 19], "space": [6, 7, 15, 16, 19], "action": [6, 7, 15, 16, 19], "reward": [6, 7, 15, 16, 19], "start": [6, 7, 19], "state": [6, 7, 19], "episod": [6, 7, 15, 16, 19], "termin": [6, 7, 15, 16, 19], "truncat": [6, 7, 19], "argument": [6, 7, 15, 16, 19], "credit": [6, 7, 19], "escort": 7, "mo": [8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18], "beach": 8, "breakthrough": 9, "congest": 10, "connect4": 11, "gemmin": 12, "ingeni": 13, "itemgath": 14, "multiwalk": 15, "multiwalkerst": 16, "pistonbal": 17, "samegam": 18, "surround": 19, "api": 20, "instal": [20, 21], "cite": 20, "releas": 22, "note": 22, "v0": 22, "0": 22, "2": 22, "dummi": 22, "1": 22, "make": 23, "custom": 23, "setup": 23, "pre": 23, "commit": 23, "hook": 23, "learn": 24, "algorithm": 24}, "envversion": {"sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2, "sphinx.ext.viewcode": 1, "sphinx": 60}, "alltitles": {"404 - Page Not Found": [[0, "page-not-found"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "MOMAland documentation": [[1, "momaland-documentation"]], "Build the Documentation": [[1, "build-the-documentation"]], "AEC": [[2, "aec"], [4, "aec"]], "Usage": [[2, "usage"], [3, "usage"]], "MOAECEnv": [[2, "moaecenv"]], "Attributes": [[2, "attributes"], [3, "attributes"]], "Methods": [[2, "methods"], [3, "methods"]], "Parallel": [[3, "parallel"], [4, "parallel"]], "MOParallelEnv": [[3, "moparallelenv"]], "Wrappers and Utils": [[4, "wrappers-and-utils"]], "Conversion": [[4, "conversion"]], "AEC to Parallel": [[4, "aec-to-parallel"]], "Parallel to AEC": [[4, "parallel-to-aec"]], "All Environments": [[5, "all-environments"]], "Catch": [[6, "catch"]], "Observation Space": [[6, "observation-space"], [7, "observation-space"], [15, "observation-space"], [16, "observation-space"], [19, "observation-space"]], "Action Space": [[6, "action-space"], [7, "action-space"], [15, "action-space"], [16, "action-space"], [19, "action-space"]], "Reward Space": [[6, "reward-space"], [7, "reward-space"], [15, "reward-space"], [16, "reward-space"], [19, "reward-space"]], "Starting State": [[6, "starting-state"], [7, "starting-state"], [19, "starting-state"]], "Episode Termination": [[6, "episode-termination"], [7, "episode-termination"], [15, "episode-termination"], [16, "episode-termination"], [19, "episode-termination"]], "Episode Truncation": [[6, "episode-truncation"], [7, "episode-truncation"], [19, "episode-truncation"]], "Arguments": [[6, "arguments"], [7, "arguments"], [15, "arguments"], [16, "arguments"], [19, "arguments"]], "Credits": [[6, "credits"], [7, "credits"], [19, "credits"]], "Escort": [[7, "escort"]], "MO-Beach": [[8, "mo-beach"]], "MO-Breakthrough": [[9, "mo-breakthrough"]], "MO-Congestion": [[10, "mo-congestion"]], "MO-Connect4": [[11, "mo-connect4"]], "MO-GemMining": [[12, "mo-gemmining"]], "MO-Ingenious": [[13, "mo-ingenious"]], "MO-ItemGathering": [[14, "mo-itemgathering"]], "MO-Multiwalker": [[15, "mo-multiwalker"]], "MO-MultiwalkerStability": [[16, "mo-multiwalkerstability"]], "MO-Pistonball": [[17, "mo-pistonball"]], "MO-SameGame": [[18, "mo-samegame"]], "Surround": [[19, "surround"]], "API": [[20, "api"]], "Install": [[20, "install"], [21, "install"]], "Citing": [[20, "citing"]], "Release Notes": [[22, "release-notes"]], "v0.0.2: Dummy release 2": [[22, "release-v0-0-2"]], "v0.0.1: Dummy release": [[22, "release-v0-0-1"]], "Making a Custom Environment": [[23, "making-a-custom-environment"]], "Setup pre-commit hooks": [[23, "setup-pre-commit-hooks"]], "Learning algorithms": [[24, "learning-algorithms"]]}, "indexentries": {"moaecenv (class in momaland.utils.env)": [[2, "momaland.utils.env.MOAECEnv"]], "action_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.action_space"]], "action_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.action_spaces"]], "agent_selection (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agent_selection"]], "agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.agents"]], "close() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.close"]], "infos (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.infos"]], "max_num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.max_num_agents"]], "num_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.num_agents"]], "observation_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observation_space"]], "observation_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.observation_spaces"]], "observe() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.observe"]], "possible_agents (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.possible_agents"]], "render() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.render"]], "reset() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reset"]], "reward_space() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.reward_space"]], "reward_spaces (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.reward_spaces"]], "rewards (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.rewards"]], "step() (momaland.utils.env.moaecenv method)": [[2, "momaland.utils.env.MOAECEnv.step"]], "terminations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.terminations"]], "truncations (momaland.utils.env.moaecenv attribute)": [[2, "momaland.utils.env.MOAECEnv.truncations"]], "moparallelenv (class in momaland.utils.env)": [[3, "momaland.utils.env.MOParallelEnv"]], "action_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.action_space"]], "action_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.action_spaces"]], "agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.agents"]], "close() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.close"]], "max_num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.max_num_agents"]], "num_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.num_agents"]], "observation_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.observation_space"]], "observation_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.observation_spaces"]], "possible_agents (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.possible_agents"]], "render() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.render"]], "reset() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reset"]], "reward_space() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.reward_space"]], "reward_spaces (momaland.utils.env.moparallelenv attribute)": [[3, "momaland.utils.env.MOParallelEnv.reward_spaces"]], "state() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.state"]], "step() (momaland.utils.env.moparallelenv method)": [[3, "momaland.utils.env.MOParallelEnv.step"]], "linearizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.LinearizeReward"]], "linearizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.LinearizeReward"]], "normalizereward (class in momaland.utils.aec_wrappers)": [[4, "momaland.utils.aec_wrappers.NormalizeReward"]], "normalizereward (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.NormalizeReward"]], "recordepisodestatistics (class in momaland.utils.parallel_wrappers)": [[4, "momaland.utils.parallel_wrappers.RecordEpisodeStatistics"]], "mo_aec_to_parallel_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_aec_to_parallel_wrapper"]], "mo_parallel_to_aec_wrapper (class in momaland.utils.conversions)": [[4, "momaland.utils.conversions.mo_parallel_to_aec_wrapper"]]}}) \ No newline at end of file