From 3aacf6a10c6928266dbdbddbd09d42a7ba86b879 Mon Sep 17 00:00:00 2001 From: LucasAlegre Date: Mon, 28 Oct 2024 16:25:57 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/MO-Gymnasium@4d05d828fde929b12d4a768293d4c8441bd8446f?= =?UTF-8?q?=20=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- main/.buildinfo | 2 +- main/environments/mujoco/index.html | 28 ++++++++++++++-------------- main/release_notes/index.html | 24 +++++++++++++++++++++++- main/searchindex.js | 2 +- 4 files changed, 39 insertions(+), 17 deletions(-) diff --git a/main/.buildinfo b/main/.buildinfo index 7ce12ae..899f6cf 100644 --- a/main/.buildinfo +++ b/main/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 91c9497a93e236aa6028d33b34ef135f +config: 1f2d7009192ea8c77aa9d5d14e6adfae tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/main/environments/mujoco/index.html b/main/environments/mujoco/index.html index c795081..9950eed 100644 --- a/main/environments/mujoco/index.html +++ b/main/environments/mujoco/index.html @@ -343,40 +343,40 @@

MuJoCo -

mo-reacher-v4

+

mo-reacher-v5

Continuous / Discrete

[target_1, target_2, target_3, target_4]

-

Mujoco version of mo-reacher-v0, based on Reacher-v4 environment.

+

Multi-objective version of Reacher-v5 environment.

-

mo-hopper-v4

+

mo-hopper-v5

Continuous / Continuous

[velocity, height, energy]

-

Multi-objective version of Hopper-v4 env.

+

Multi-objective version of Hopper-v5 env.

-

mo-halfcheetah-v4

+

mo-halfcheetah-v5

Continuous / Continuous

[velocity, energy]

-

Multi-objective version of HalfCheetah-v4 env. Similar to Xu et al. 2020.

+

Multi-objective version of HalfCheetah-v5 env. Similar to Xu et al. 2020.

-

mo-walker2d-v4

+

mo-walker2d-v5

Continuous / Continuous

[velocity, energy]

-

Multi-objective version of Walker2d-v4 env.

+

Multi-objective version of Walker2d-v5 env.

-

mo-ant-v4

+

mo-ant-v5

Continuous / Continuous

[x_velocity, y_velocity, energy]

-

Multi-objective version of Ant-v4 env.

+

Multi-objective version of Ant-v5 env.

-

mo-swimmer-v4

+

mo-swimmer-v5

Continuous / Continuous

[velocity, energy]

-

Multi-objective version of Swimmer-v4 env.

+

Multi-objective version of Swimmer-v5 env.

-

mo-humanoid-v4

+

mo-humanoid-v5

Continuous / Continuous

[velocity, energy]

-

Multi-objective version of Humonoid-v4 env.

+

Multi-objective version of Humonoid-v5 env.

diff --git a/main/release_notes/index.html b/main/release_notes/index.html index ab2676f..e20a491 100644 --- a/main/release_notes/index.html +++ b/main/release_notes/index.html @@ -332,6 +332,27 @@

Release Notes

+
+

v1.3.0: MO-Gymnasium 1.3.0 Release: New Mujoco v5 Environments

+

Released on 2024-10-28 - GitHub - PyPI

+

This release adds the new Mujoco v5 environments:

+
    +
  • mo-ant-v5
  • +
  • mo-ant-2obj-v5
  • +
  • mo-hopper-v5
  • +
  • mo-hopper-2obj-v5
  • +
  • mo-walker2d-v5
  • +
  • mo-halfcheetah-v5
  • +
  • mo-humanoid-v5
  • +
  • mo-swimmer-v5
  • +
+

What's Changed

+ +

Full Changelog: v1.2.0...v1.3.0

v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more

Released on 2024-10-16 - GitHub - PyPI

@@ -441,7 +462,7 @@

MO-Gymnasium 1.0.0 Release Notes

reward = forward_reward - ctrl_cost

With MORL, users have the flexibility to determine the compromises they desire based on their preferences for each objective. Consequently, the environments in MO-Gymnasium do not have predefined weights. Thus, MO-Gymnasium extends the capabilities of Gymnasium to the multi-objective setting, where the agents receives a vectorial reward.

For example, here is an illustration of the multiple policies learned by an MORL agent for the mo-halfcheetah domain, balancing between saving battery and speed:

- +

This release marks the first mature version of MO-Gymnasium within Farama, indicating that the API is stable, and we have achieved a high level of quality in this library.

API

  • Release Notes
      +
    • v1.3.0: MO-Gymnasium 1.3.0 Release: New Mujoco v5 Environments
    • v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more
    • v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more
    • v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more
    • diff --git a/main/searchindex.js b/main/searchindex.js index bc828f0..84b4baf 100644 --- a/main/searchindex.js +++ b/main/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"0.1.1": [[47, "release-0-1-1"]], "0.1.2": [[47, "release-0-1-2"]], "0.2.0": [[47, "release-0-2-0"]], "0.2.1": [[47, "release-0-2-1"]], "1. Create a new environment class": [[48, "create-a-new-environment-class"]], "2. Register the environment": [[48, "register-the-environment"]], "3. Test the environment": [[48, "test-the-environment"]], "4. Instantiate your environment": [[48, "instantiate-your-environment"]], "404 - Page Not Found": [[0, null]], "API": [[44, null], [45, null]], "Acknowledgements": [[3, "acknowledgements"]], "Action Space": [[4, "action-space"], [6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [13, "action-space"], [14, "action-space"], [15, "action-space"], [34, "action-space"], [39, "action-space"], [40, "action-space"]], "Arguments": [[4, "arguments"], [6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [13, "arguments"], [14, "arguments"], [15, "arguments"], [40, "arguments"]], "Breakable-Bottles": [[4, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Citation": [[41, null]], "Citing": [[44, "citing"]], "Classic Control": [[5, null]], "Community": [[3, null]], "Creating a custom environment": [[48, null]], "Credits": [[4, "credits"], [6, "credits"], [7, "credits"], [8, "credits"], [9, "credits"], [10, "credits"], [13, "credits"], [14, "credits"], [15, "credits"], [39, "credits"], [40, "credits"]], "Deep-Sea-Treasure": [[6, null]], "Deep-Sea-Treasure-Concave": [[7, null]], "Deep-Sea-Treasure-Mirrored": [[8, null]], "Description": [[4, "description"], [6, "description"], [7, "description"], [8, "description"], [9, "description"], [10, "description"], [11, "description"], [13, "description"], [14, "description"], [15, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [39, "description"], [40, "description"]], "Episode Termination": [[4, "episode-termination"], [6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [11, "episode-termination"], [13, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [35, "episode-termination"], [39, "episode-termination"]], "Fishwood": [[9, null]], "Four-Room": [[10, null]], "Fruit-Tree": [[11, null]], "Grid-World": [[12, null]], "Install": [[44, "install"], [46, null]], "LinearReward": [[50, "linearreward"]], "List of Publications": [[43, null]], "MO-Ant": [[17, null]], "MO-Ant-2D": [[18, null]], "MO-Ant-2Obj": [[19, null]], "MO-Gymnasium 0.3.0 Release: Migrate to Gymnasium": [[47, "release-0-3-0"]], "MO-Gymnasium 0.3.1 Release: Improved documentation and MuJoco MO-Reacher environment": [[47, "release-0-3-1"]], "MO-Gymnasium 0.3.2 Release: Bug fixes, improved webpage": [[47, "release-0-3-2"]], "MO-Gymnasium documentation": [[1, null]], "MO-Halfcheetah": [[20, null]], "MO-Highway": [[21, null]], "MO-Highway-Fast": [[22, null]], "MO-Hopper": [[23, null]], "MO-Hopper-2D": [[24, null]], "MO-Hopper-2Obj": [[25, null]], "MO-Humanoid": [[26, null]], "MO-Lunar-Lander": [[27, null]], "MO-Lunar-Lander-Continuous": [[28, null]], "MO-Mountaincar": [[29, null]], "MO-Mountaincar-3D": [[30, null]], "MO-Mountaincar-Timemove": [[31, null]], "MO-Mountaincar-Timespeed": [[32, null]], "MO-Mountaincarcontinuous": [[33, null]], "MO-Reacher": [[34, null]], "MO-Supermario": [[35, null]], "MO-Swimmer": [[36, null]], "MO-Walker2D": [[37, null]], "MOClipReward": [[50, "moclipreward"]], "MOMaxAndSkipObservation": [[50, "momaxandskipobservation"]], "MONormalizeReward": [[50, "monormalizereward"]], "MORL Baselines": [[42, null]], "MORecordEpisodeStatistics": [[49, "morecordepisodestatistics"], [50, "morecordepisodestatistics"]], "MOSyncVectorEnv": [[49, "mosyncvectorenv"]], "Minecart": [[13, null]], "Minecart-Deterministic": [[14, null]], "Minecart-Rgb": [[15, null]], "Miscellaneous": [[16, null]], "MuJoCo": [[38, null]], "Observation Space": [[4, "observation-space"], [6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [13, "observation-space"], [14, "observation-space"], [15, "observation-space"], [34, "observation-space"], [39, "observation-space"], [40, "observation-space"]], "References": [[10, "references"]], "Release Notes": [[47, null]], "Resource-Gathering": [[39, null]], "Reward Space": [[4, "reward-space"], [6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [9, "reward-space"], [10, "reward-space"], [11, "reward-space"], [13, "reward-space"], [14, "reward-space"], [15, "reward-space"], [17, "reward-space"], [18, "reward-space"], [19, "reward-space"], [20, "reward-space"], [21, "reward-space"], [23, "reward-space"], [24, "reward-space"], [25, "reward-space"], [26, "reward-space"], [27, "reward-space"], [28, "reward-space"], [34, "reward-space"], [35, "reward-space"], [36, "reward-space"], [37, "reward-space"], [39, "reward-space"], [40, "reward-space"]], "Reward space:": [[29, "reward-space"], [30, "reward-space"], [31, "reward-space"], [32, "reward-space"], [33, "reward-space"]], "Starting State": [[4, "starting-state"], [6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [13, "starting-state"], [14, "starting-state"], [15, "starting-state"], [39, "starting-state"], [40, "starting-state"]], "Termination": [[9, "termination"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Vector Wrappers": [[49, null]], "Version History": [[17, "version-history"], [19, "version-history"], [20, "version-history"], [23, "version-history"], [25, "version-history"], [37, "version-history"]], "Version History:": [[26, "version-history"], [34, "version-history"], [36, "version-history"]], "Water-Reservoir": [[40, null]], "Wrappers": [[50, null]], "v0.3.3: MO-Gymnasium 0.3.3 Release: Policy Evaluation bug fix, better documentation page": [[47, "release-v0-3-3"]], "v0.3.4: MO-Gymnasium 0.3.4 Release: Known Pareto Front, improved renders and documentation": [[47, "release-v0-3-4"]], "v1.0.0: MO-Gymnasium becomes mature": [[47, "release-v1-0-0"]], "v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more": [[47, "release-v1-0-1"]], "v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more": [[47, "release-v1-1-0"]], "v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more": [[47, "release-v1-2-0"]]}, "docnames": ["404", "README", "citing/citing", "community/community", "environments/breakable-bottles", "environments/classical", "environments/deep-sea-treasure", "environments/deep-sea-treasure-concave", "environments/deep-sea-treasure-mirrored", "environments/fishwood", "environments/four-room", "environments/fruit-tree", "environments/grid-world", "environments/minecart", "environments/minecart-deterministic", "environments/minecart-rgb", "environments/misc", "environments/mo-ant", "environments/mo-ant-2d", "environments/mo-ant-2obj", "environments/mo-halfcheetah", "environments/mo-highway", "environments/mo-highway-fast", "environments/mo-hopper", "environments/mo-hopper-2d", "environments/mo-hopper-2obj", "environments/mo-humanoid", "environments/mo-lunar-lander", "environments/mo-lunar-lander-continuous", "environments/mo-mountaincar", "environments/mo-mountaincar-3d", "environments/mo-mountaincar-timemove", "environments/mo-mountaincar-timespeed", "environments/mo-mountaincarcontinuous", "environments/mo-reacher", "environments/mo-supermario", "environments/mo-swimmer", "environments/mo-walker2d", "environments/mujoco", "environments/resource-gathering", "environments/water-reservoir", "examples/citation", "examples/morl_baselines", "examples/publications", "index", "introduction/api", "introduction/install", "release_notes", "tutorials/custom_env", "wrappers/vector_wrappers", "wrappers/wrappers"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["404.md", "README.md", "citing/citing.md", "community/community.md", "environments/breakable-bottles.md", "environments/classical.md", "environments/deep-sea-treasure.md", "environments/deep-sea-treasure-concave.md", "environments/deep-sea-treasure-mirrored.md", "environments/fishwood.md", "environments/four-room.md", "environments/fruit-tree.md", "environments/grid-world.md", "environments/minecart.md", "environments/minecart-deterministic.md", "environments/minecart-rgb.md", "environments/misc.md", "environments/mo-ant.md", "environments/mo-ant-2d.md", "environments/mo-ant-2obj.md", "environments/mo-halfcheetah.md", "environments/mo-highway.md", "environments/mo-highway-fast.md", "environments/mo-hopper.md", "environments/mo-hopper-2d.md", "environments/mo-hopper-2obj.md", "environments/mo-humanoid.md", "environments/mo-lunar-lander.md", "environments/mo-lunar-lander-continuous.md", "environments/mo-mountaincar.md", "environments/mo-mountaincar-3d.md", "environments/mo-mountaincar-timemove.md", "environments/mo-mountaincar-timespeed.md", "environments/mo-mountaincarcontinuous.md", "environments/mo-reacher.md", "environments/mo-supermario.md", "environments/mo-swimmer.md", "environments/mo-walker2d.md", "environments/mujoco.md", "environments/resource-gathering.md", "environments/water-reservoir.md", "examples/citation.md", "examples/morl_baselines.md", "examples/publications.md", "index.md", "introduction/api.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "wrappers/vector_wrappers.md", "wrappers/wrappers.md"], "indexentries": {"linearreward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.LinearReward", false]], "moclipreward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MOClipReward", false]], "momaxandskipobservation (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MOMaxAndSkipObservation", false]], "monormalizereward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MONormalizeReward", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MORecordEpisodeStatistics", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers.vector)": [[49, "mo_gymnasium.wrappers.vector.MORecordEpisodeStatistics", false]], "mosyncvectorenv (class in mo_gymnasium.wrappers.vector)": [[49, "mo_gymnasium.wrappers.vector.MOSyncVectorEnv", false]]}, "objects": {"mo_gymnasium.wrappers": [[50, 0, 1, "", "LinearReward"], [50, 0, 1, "", "MOClipReward"], [50, 0, 1, "", "MOMaxAndSkipObservation"], [50, 0, 1, "", "MONormalizeReward"], [50, 0, 1, "", "MORecordEpisodeStatistics"]], "mo_gymnasium.wrappers.vector": [[49, 0, 1, "", "MORecordEpisodeStatistics"], [49, 0, 1, "", "MOSyncVectorEnv"]]}, "objnames": {"0": ["py", "class", "Python class"]}, "objtypes": {"0": "py:class"}, "terms": {"": [4, 5, 6, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 44, 45, 47, 50], "0": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 49, 50], "01": 47, "02": 47, "03": 47, "06": 47, "07": [29, 30, 31, 32, 33], "08": [47, 50], "09": 47, "1": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 49, 50], "10": [6, 7, 8, 11, 12, 27, 28, 39, 40, 47], "100": [27, 28, 35, 47, 49, 50], "101": 47, "103": 47, "105": [17, 19, 47], "106": 47, "107": 47, "11": [6, 7, 23, 24, 25, 47], "1109": 40, "1145": 39, "12": 47, "124": [7, 8], "13": [10, 47], "1390156": 39, "1390162": 39, "14": [10, 47], "16": 47, "160": 40, "17": [20, 26, 37], "18": 47, "19": 47, "1e": [23, 25, 36, 37, 50], "2": [4, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 49], "20": [8, 47], "200": 9, "2008": [12, 39], "2010": 12, "2011": 5, "2012": 40, "2013": 16, "2017": 10, "2018": 12, "2019": [6, 7, 8, 11, 12, 13, 14, 15, 16], "2020": 38, "2021": 12, "2022": [2, 5, 12, 43, 47], "2022bnaic": 2, "2023": [41, 43, 44, 47], "2024": [43, 47], "21": 47, "23": [6, 47], "24": 47, "240": [4, 35], "25": [26, 35, 47], "255": [15, 35], "256": 35, "25th": 39, "26": 47, "27": [18, 47], "28": [27, 28], "2d": [6, 7, 8, 10, 13, 14, 15, 17, 19, 23, 25, 33, 47, 49], "2obj": [17, 23], "3": [4, 6, 7, 8, 10, 13, 14, 15, 17, 18, 19, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 35, 37, 39, 40, 49], "30": 47, "31": 47, "33": 47, "34": 47, "348": 26, "34th": 2, "35": 47, "360": 4, "37": 47, "37th": [41, 44], "3d": [5, 13, 14, 15, 29, 31, 32], "4": [4, 6, 7, 8, 10, 13, 14, 15, 26, 27, 28, 34, 35, 36, 39, 40, 49, 50], "40": 47, "41": [39, 47], "42": [47, 49], "43": 47, "45": 47, "46": 47, "47": [39, 47], "480": 15, "5": [4, 11, 12, 13, 14, 15, 21, 22, 27, 28, 35, 39, 47], "50": [4, 47], "51": 47, "52": 47, "53": 47, "55": 47, "56": 47, "57": 47, "58": 47, "59": 47, "6": [11, 12, 13, 14, 15, 20, 27, 28, 29, 30, 31, 32, 33, 34, 37], "60": 47, "61": 47, "62": 47, "6252759": 40, "63": 11, "64": 47, "65": 47, "67": 47, "69": 47, "7": [6, 11, 12, 13, 14, 15, 47, 49], "70": 47, "72": 47, "73": 47, "74": 47, "75": 47, "76": 47, "77": 47, "79": 47, "8": [17, 18, 19, 27, 28, 36, 40, 44, 45, 47], "80": 47, "81": 47, "83": 47, "84": 47, "86": 47, "87": 47, "89": 47, "9": 34, "90": 47, "91": 47, "92": 47, "93": 47, "94": 47, "95": 47, "97": 47, "99": [47, 50], "A": [2, 4, 10, 16, 17, 18, 19, 22, 23, 25, 29, 30, 31, 32, 33, 40, 41, 43, 44, 45, 50], "As": [4, 44, 45], "At": 49, "But": 50, "By": [29, 30, 31, 32, 40], "For": [1, 34, 44, 45, 47, 49], "If": [3, 13, 14, 15, 17, 18, 19, 23, 24, 25, 40, 41, 44, 48], "In": [4, 47], "It": [42, 44, 45, 47, 48], "Of": 47, "The": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 33, 34, 35, 36, 37, 39, 40, 44, 47, 48, 49], "There": 40, "To": [1, 6, 7, 8, 44, 46], "With": 47, "_": 49, "__init__": 48, "_build": 1, "_episod": 49, "_forward_reward_weight": 47, "_modul": 50, "aama": 43, "abel": [13, 14, 15, 16], "about": [1, 5], "abov": 4, "acceler": [13, 14, 15], "accept": 47, "access": [47, 49], "account": [4, 12], "achiev": 47, "act": [44, 45, 47], "action": [5, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 47, 48, 49], "action_spac": [48, 49], "acttyp": 50, "ad": [17, 18, 19, 23, 24, 25, 47, 48, 49], "adapt": [6, 7, 8, 10], "add": [29, 30, 31, 32, 43, 47], "add_speed_object": [29, 30, 31, 32], "addit": 5, "addition": 47, "after": [9, 47, 50], "again": 4, "agent": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 39, 40, 47], "ai": 4, "al": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 38, 43], "alegr": [2, 12, 41, 43, 44], "algorithm": [42, 44], "align": 43, "all": [3, 17, 18, 19, 39, 44, 46, 47, 49, 50], "allow": 47, "also": [3, 16, 44, 45, 47], "altern": [29, 30, 31, 32], "alwai": [6, 7, 8], "amount": [16, 40], "amp": 47, "an": [5, 10, 29, 30, 31, 32, 35, 39, 40, 44, 45, 47, 48, 50], "ana": [2, 41, 44], "andrea": 47, "andr\u00e9": 10, "angl": 34, "angular": 34, "ani": 49, "ann": [2, 41, 44], "ansi": 40, "ansimuz": [6, 7, 8], "ant": 38, "antenv": [17, 18, 19], "api": [42, 47, 48], "appear": 2, "appli": [4, 34, 49], "approach": 4, "approxim": 43, "ar": [3, 4, 13, 14, 15, 16, 39, 40, 47, 48, 49, 50], "arm": 34, "arrai": [10, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 48, 49, 50], "art": [4, 6, 7, 8, 47], "artifici": 2, "asid": 3, "ask": 3, "asset": [4, 39, 47], "assist": [4, 6, 7, 8], "associ": 47, "atari_wrapp": 50, "attribut": 48, "australia": 40, "author": [2, 41, 44], "autobuild": 1, "automat": [1, 47, 48], "avail": [47, 49, 50], "averag": 50, "avoid": [10, 16], "axel": [13, 14, 15], "axelabel": 3, "axi": [23, 24, 25], "b": 1, "back": 47, "background": [6, 7, 8, 40], "backward": 5, "balanc": 47, "barret": 12, "barreto": 10, "barrett": 39, "base": [3, 4, 13, 14, 15, 34, 38, 40, 43, 47, 50], "baselin": 47, "baselines3": 50, "batteri": 47, "bazzan": [2, 41, 44], "becaus": 4, "been": [4, 5, 47], "befor": 49, "begin": [49, 50], "behind": 5, "benchmark": [41, 43, 44], "benefit": 47, "benelearn": 2, "benelux": 2, "between": [35, 40, 44, 47, 50], "bib": 47, "binari": [10, 11, 12], "blob": [13, 14, 15], "blue": 10, "bnaic": [2, 43], "bnj6kubtg6": 44, "booktitl": [2, 41, 44], "bool": 49, "boolean": [4, 49], "both": 50, "both_norm_env": 50, "bottl": 12, "bottle_reward": 4, "bottles_carri": 4, "bottles_deliv": [4, 12], "bottles_drop": 4, "bound": [40, 47], "box": [6, 7, 8, 17, 18, 19, 20, 23, 24, 25, 26, 28, 33, 36, 37, 40], "brake": [13, 14, 15], "break": 47, "breakabl": 12, "breakablebottl": 4, "brisban": 40, "bro": 35, "bruno": [2, 41, 44], "budget": 43, "buffer": 49, "buffer_length": [49, 50], "bugfix": 47, "bump": 47, "button": 47, "c": [2, 41, 44], "cai": 43, "calcul": 4, "call": 47, "callabl": 49, "can": [3, 4, 9, 11, 13, 14, 15, 17, 19, 23, 25, 29, 30, 31, 32, 40, 44, 45, 46, 47, 49, 50], "cannot": 4, "capabl": 47, "capac": [13, 14, 15], "car": [5, 29, 30, 31, 32, 47], "carb": [11, 12], "care": 49, "carri": 4, "cart": [13, 14, 15], "castelletti": 40, "catch": 9, "caus": 47, "cc": 47, "cd": 1, "cell": 12, "central": 34, "certain": [44, 46], "chanc": 12, "chang": [1, 6, 7, 8, 20, 26, 29, 30, 31, 32, 47], "changelog": 47, "check": [44, 45, 47], "chose": 11, "ci": 47, "circl": 10, "citat": 47, "cite": 41, "class": [5, 44, 45, 49, 50], "classic": [6, 7, 8, 48], "clip": 50, "close": 48, "co": [13, 14, 15, 34], "code": [3, 6, 7, 8, 9, 10, 13, 14, 15, 40, 47, 50], "coin": [16, 35], "colab": [44, 45], "collect": [9, 10, 11, 12, 13, 14, 15, 16, 35, 39, 47], "collis": [16, 21], "com": [3, 13, 14, 15], "combin": 47, "commit": 47, "common": 50, "commun": [44, 47], "compar": 44, "complet": 50, "compliant": 44, "compon": [10, 47, 50], "compromis": 47, "comput": [34, 47, 48], "concav": [12, 47], "concave_map": [6, 7, 8], "conduct": 47, "confer": [2, 39, 40, 41, 44], "config": [13, 14, 15], "configur": [13, 14, 15], "conflict": 47, "conor": 3, "consequ": 47, "consist": 39, "constructor": 48, "consum": [13, 14, 15], "consumpt": [5, 13, 14, 15, 16], "contact": [17, 19, 26], "contain": [1, 4, 10, 11, 12, 13, 14, 15, 29, 30, 31, 32, 33, 34, 42], "content": 40, "context": 47, "continu": [5, 6, 7, 8, 16, 33, 38, 40, 47], "contribut": [1, 3, 4, 47], "contributor": [3, 47], "control": [6, 7, 8, 9, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "control_cost": 47, "converg": 5, "convers": 47, "convex": [6, 7, 8], "coordin": [6, 7, 8, 39, 44], "copi": 49, "corner": [13, 14, 15], "correct": 47, "correspond": [16, 29, 30, 31, 32, 40], "cost": [17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 36, 37, 40], "cost_flood": 16, "cost_object": [17, 18, 19, 23, 24, 25], "crash": [27, 28], "creat": [4, 6, 7, 8, 44, 45, 47], "creation": 47, "criteria": 39, "ctrl_cost": 47, "cumul": [49, 50], "current": [4, 6, 7, 8, 40], "custom": 47, "d": [11, 12, 43], "da": [2, 41, 44], "dall": [4, 6, 7, 8], "dam": [16, 40], "danoi": [2, 41, 44], "deal": 48, "death": 16, "decis": 40, "decomposit": 43, "deep": [3, 12, 49, 50], "deep_sea_treasur": 47, "deepseatreasur": [6, 7, 8], "default": [6, 7, 8, 13, 14, 15, 29, 30, 31, 32, 40], "deficit": 40, "deficit_wat": 16, "defin": [4, 5, 16, 34, 48], "definit": [44, 45], "deliv": [4, 12], "demand": 40, "deni": [3, 9], "dens": [13, 14, 15], "depend": [44, 46], "deprec": 47, "depth": [11, 12], "deque_s": 49, "descript": [5, 12, 16, 38], "design": [47, 49], "desir": 47, "destin": 12, "detail": [5, 44, 45], "determin": 47, "determinist": 47, "develop": 44, "deviat": 50, "di": 35, "diamond": 39, "dict": 4, "dictionari": [4, 12], "did": 4, "differ": [4, 12, 47], "dim_reward": 49, "dimens": [4, 47], "dimension": [6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 39], "directli": [47, 49, 50], "directori": 48, "dirhtml": 1, "disc_episode_return": 47, "discord": [3, 44], "discount": [48, 49, 50], "discret": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 21, 22, 27, 29, 30, 31, 32, 34, 35, 38, 39, 47], "dissert": 5, "distanc": [34, 48], "distinct": 47, "distribut": 43, "do": 47, "doc": [1, 47], "document": [44, 48], "doe": [44, 46, 50], "doi": 40, "domain": 47, "done": [48, 49], "dot": 50, "down": [6, 7, 8, 10, 39], "downstream": 40, "dr": [49, 50], "drop": [4, 47], "dst": [12, 47], "dst_map": [6, 7, 8], "dtype": [47, 49], "due": [5, 40], "dynmorl": 3, "e": [1, 2, 4, 6, 7, 8, 12, 33, 41, 44, 47], "each": [4, 6, 7, 8, 11, 13, 14, 15, 29, 30, 31, 32, 33, 34, 47, 49], "eat": 12, "edit": 47, "effici": 43, "either": 9, "el": [2, 41, 44], "elaps": [49, 50], "elbow": 34, "element": [39, 47], "els": [10, 35, 39], "en": 50, "enabl": 47, "end": [9, 13, 14, 15, 49], "enemi": [4, 12, 16, 35, 39], "energi": 38, "engin": [27, 28], "entri": 43, "entry_point": 48, "env": [3, 5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 38, 44, 45, 47, 48, 49, 50], "env_fn": 49, "environ": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 43, 44, 45, 46, 49], "episod": [9, 40, 49, 50], "epsilon": 50, "equival": 5, "error": 47, "esr": [12, 47], "essenti": [44, 48], "et": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 38, 43], "eval_mo": 47, "everi": [1, 11, 12, 50], "exampl": [10, 42, 44, 45, 47, 49, 50], "except": 50, "excess": 40, "execut": [16, 40], "exhaust": 47, "expand": 47, "expect": 9, "extend": 47, "extra": [5, 29, 30, 31, 32], "extract": 50, "ezpickl": 47, "f": [3, 40], "fair": 43, "fall": 47, "fals": [17, 18, 19, 23, 24, 25, 49], "famili": [44, 46], "fan": 43, "fantasi": [6, 7, 8], "far": 35, "farama": [3, 13, 14, 15, 17, 19, 20, 23, 25, 26, 34, 36, 37, 44, 47], "fast": [16, 47], "fat": [11, 12], "featur": [3, 10, 47], "feder": 43, "felten": [2, 12, 41, 43, 44], "felten_toolkit_2023": [41, 44], "few": [47, 49, 50], "ffelten": 47, "file": [13, 14, 15, 47, 48], "fill": [13, 14, 15], "finger_tip_coord": 34, "fire": 12, "first": [2, 13, 14, 15, 40, 43, 47, 49], "fish": [9, 12], "fish_amount": 12, "fisherman": 9, "fishproba": 9, "fishwood": [3, 12, 47], "fit": 40, "fix": 10, "flag": [4, 17, 18, 19, 23, 24, 25, 35, 39, 48], "flexibl": 47, "float": [40, 48, 49, 50], "float32": [17, 18, 19, 20, 23, 24, 25, 26, 28, 33, 36, 37, 40, 49], "float_stat": [6, 7, 8], "flood": 40, "florian": [2, 41, 44], "folder": [1, 47], "follow": [2, 10, 13, 14, 15, 17, 18, 19, 20, 23, 24, 25, 26, 29, 30, 31, 32, 36, 37, 44, 45, 47, 48], "forc": [17, 19, 26], "forgotten": 47, "fork": 1, "form": 49, "formerli": [2, 43], "forward": [5, 20, 23, 24, 25, 26, 29, 30, 31, 32, 36, 37], "forward_penalti": 5, "forward_reward": 47, "found": 47, "foundat": [13, 14, 15, 47], "four": [3, 12, 34], "frame": 50, "frame_skip": [13, 14, 15], "frameskip": 50, "framework": 43, "from": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 26, 39, 40, 47, 48, 49, 50], "front": 48, "fruit": [3, 12], "fruit_tre": 47, "fuel": [5, 13, 14, 15, 16, 27, 28, 33], "fuel_consumption_penalti": 5, "full": [11, 12, 47], "function": [44, 45, 47], "g": [10, 12, 47], "gamma": [48, 49, 50], "gather": [12, 47], "gem": [4, 12, 39], "gener": [43, 47, 48], "get": 47, "gg": 44, "ghazali": [2, 41, 44], "gif": 47, "gimelfarb": [3, 10], "github": [3, 13, 14, 15, 47], "give": 5, "given": 50, "go": [1, 9, 11, 23, 24, 25, 29, 30, 31, 32], "goal": [10, 12, 29, 30, 31, 32, 33], "goe": 48, "goir": [2, 41, 44], "gold": [4, 12, 39], "gr": [2, 41, 44], "green": 10, "grid": [6, 7, 8], "gridworld": [10, 12], "ground": 4, "group": 47, "gt": 47, "guarante": 43, "guid": [44, 45], "gupta": 5, "gym": [2, 35, 43, 44, 45, 47], "gymnasium": [2, 5, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 42, 43, 44, 45, 46, 48, 49, 50], "ha": [4, 5, 17, 19, 20, 23, 25, 26, 35, 47, 49], "half_cheetah": 20, "halfcheetah": [38, 47], "halfcheetahenv": 20, "harder": 12, "hartmann": 43, "have": [3, 4, 5, 12, 44, 47, 50], "hay": 3, "healthi": [17, 18, 19], "heavili": 50, "height": 38, "help": 3, "here": [3, 10, 44, 45, 47], "high": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 47], "higher": 47, "highwai": [16, 47], "highwayenv": 21, "highwayfastenv": 22, "home": [4, 39], "hopper": [38, 47], "hopperenv": [23, 24, 25], "hotfix": 47, "how": [1, 13, 14, 15, 35, 42, 47], "html": 50, "http": [3, 4, 6, 7, 8, 13, 14, 15, 17, 19, 20, 23, 25, 26, 34, 36, 37, 39, 40, 44, 50], "human": [13, 14, 15, 40], "humanoid": 38, "humanoidenv": 26, "humonoid": 38, "hung": 5, "hydroelectr": 40, "hyperparamet": 43, "i": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 42, 44, 45, 47, 48, 49, 50], "ianleongudri": 47, "id": [17, 19, 23, 25, 48], "idx": 50, "igd": 48, "ijcnn": 40, "illustr": 47, "imag": [13, 14, 15, 16, 40], "image_observ": [13, 14, 15], "impact": 4, "implement": [4, 42, 48], "import": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "improv": 43, "includ": [16, 17, 19, 26, 44, 46], "inconsist": 47, "increment": [13, 14, 15], "incremental_frame_skip": [13, 14, 15], "index": [49, 50], "indic": [4, 10, 39, 47, 49], "inf": [4, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 40], "info": [44, 45, 47, 48, 49, 50], "info_dict": 47, "inform": [1, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 41, 44], "inher": 47, "inherit": 48, "init": 47, "initi": [40, 48], "initial_st": 40, "inproceed": [2, 41, 44], "inspir": 50, "instal": 1, "instanc": [44, 45, 47], "instanti": [17, 19, 23, 25], "instead": [4, 17, 19, 23, 25, 47], "int": [49, 50], "int32": 49, "integ": 48, "integr": 47, "intellig": 2, "interact": [44, 45], "intern": [39, 40], "introduc": [5, 10, 47], "invert": 48, "io": [4, 6, 7, 8, 39, 50], "issu": 47, "itch": [4, 6, 7, 8, 39], "item": [10, 12], "item1": 12, "item2": 12, "item3": 12, "iter": [40, 49], "its": 48, "ivanov": 43, "j": 47, "johnson": 47, "join": [3, 44], "joint": [34, 40], "json": [13, 14, 15], "jump": [23, 24, 25], "kallinteri": 47, "katze2664": 47, "keep": [49, 50], "kei": [4, 49], "kill": [12, 35, 39], "klassert": 4, "known": 48, "kwarg": 48, "l": [2, 41, 44, 49, 50], "lack": 5, "lambda": 49, "land": [5, 27, 28], "lander": [5, 47], "lane": [16, 21], "larger": 4, "last": [49, 50], "leaf": [11, 12], "learn": [2, 4, 9, 10, 39, 41, 43, 44, 45, 47], "left": [4, 6, 7, 8, 10, 11, 13, 14, 15, 39], "length": [49, 50], "length_queu": 49, "leon": 39, "level": [40, 47], "leverag": 43, "librari": [2, 43, 44, 47], "life": 47, "light": 12, "like": [3, 44, 46, 50], "limezu": [4, 39], "limit": 16, "line": 48, "linear": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "linearli": 47, "linearreward": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "linearwrapp": 47, "link": 47, "lint": 47, "list": [4, 47], "literatur": 47, "local": 5, "locat": [4, 12, 34], "logo": 47, "look": 50, "low": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "lower": 10, "luca": [2, 41, 44], "lucasalegr": 47, "lunar": [5, 47], "lunarland": [5, 27, 28], "m": 40, "machin": 39, "made": [1, 47], "mai": 47, "main": [3, 13, 14, 15, 27, 28, 36, 37], "main_engine_fuel": 5, "make": [1, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "mani": [13, 14, 15, 49], "map": [6, 7, 8, 10, 12, 13, 14, 15, 47], "mario": [35, 47], "mark": 47, "markov": 40, "master": 50, "match": 47, "mathieu": [3, 40], "max": 50, "max_r": 50, "max_t": 9, "maxandskipenv": 50, "maxima": 5, "maximum": 40, "maze": 10, "md": [1, 47], "mdp": [44, 45, 47], "mean": 50, "merg": [5, 29, 30, 31, 32], "merge_move_penalti": [29, 30, 31, 32], "method": [47, 48], "metric": 48, "mgoulao": 47, "mike": [3, 10], "min": 50, "min_r": 50, "mine": [13, 14, 15], "mine_config": [13, 14, 15], "minecart": [3, 16, 44, 45, 47], "miner": [11, 12], "minerium": [13, 14, 15], "minim": [13, 14, 15, 16], "minor": 47, "mirror": 12, "mirrored_map": [6, 7, 8], "miss": [43, 47], "mistak": 47, "mo": [2, 3, 5, 13, 14, 15, 16, 38, 42, 43, 44, 45, 46, 48, 49, 50], "mo_gym": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 49, 50], "mo_gymnasium": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "mode": [13, 14, 15, 40], "model": [43, 44, 45], "modem": 43, "modifi": 47, "modul": [49, 50], "mofl": 43, "momaxandskipobserv": 47, "momdp": [44, 45, 47], "monormalizereward": 47, "more": [1, 5, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 44, 45], "morecordepisodestatist": 47, "moreov": [48, 49], "morewordstatist": 49, "morl": [3, 6, 7, 8, 9, 44, 45, 47], "most": 49, "mountain": [5, 29, 30, 31, 32, 33, 47], "mountaincar": [5, 33], "mountaincarcontinu": [5, 47], "move": [4, 5, 35, 36, 39, 47, 50], "move_penalti": 5, "much": 35, "mujoco": [17, 19, 20, 23, 25, 26, 34, 36, 37, 44, 46], "multi": [2, 5, 9, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 40, 41, 43, 44, 45, 47, 48], "multibinari": 4, "multiobject": 4, "multipl": [4, 39, 42, 43, 47, 48, 49], "must": [12, 13, 14, 15, 16, 48], "my_env_dir": 48, "my_env_fil": 48, "my_env_v0": 48, "myenv": 48, "mypi": 47, "n": [2, 41, 44], "nO": 40, "narayanan": [12, 39], "ndarrai": 50, "need": 47, "neg": [10, 33, 34], "neighbour": 16, "network": 40, "neural": [40, 41, 44], "neurip": [41, 43, 44], "next": 48, "next_ob": [44, 45, 47], "ninjikin": [4, 39], "nip": 10, "node": 11, "none": [13, 14, 15, 40, 47, 50], "norm": 33, "norm_treasure_env": 50, "normal": [40, 47, 49, 50], "normalized_act": 40, "note": [4, 50], "notebook": [44, 45], "now": [2, 17, 19, 23, 25, 26, 41, 44, 47], "np": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "num": 49, "num_env": 49, "number": [4, 40], "numpi": [44, 45, 47, 48], "nutri1": 12, "nutri6": 12, "nutrient": [11, 12], "ob": [5, 12, 16, 38, 44, 45, 47, 49], "object": [2, 5, 9, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 40, 41, 43, 44, 45, 47, 48], "observ": [12, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 47, 48, 50], "observation_spac": 48, "observationspac": 47, "obstyp": 50, "off": 47, "oject": 48, "onc": 1, "one": [44, 46, 47, 50], "onli": [40, 50], "open": [43, 44], "opengameart": 40, "optim": [39, 43, 47], "option": [29, 30, 31, 32, 44, 45, 47, 48], "order": 47, "ore1": 16, "ore2": 16, "ores": [13, 14, 15, 16], "org": [17, 19, 20, 23, 25, 26, 34, 36, 37, 40, 44], "orient": [13, 14, 15], "origin": [4, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "other": [16, 17, 18, 19, 20, 23, 24, 25, 44, 45, 47, 50], "otherwis": [4, 9, 35], "our": [1, 47, 48], "out": [3, 40], "outcom": 4, "output": 49, "packag": [1, 47], "paper": 4, "pareto": [43, 48], "pareto_front": [47, 48], "parisi": 40, "part": [47, 48], "pass": [35, 47], "passag": 10, "path": [13, 14, 15], "paulina": 40, "penal": 40, "penalti": [4, 5, 6, 7, 8, 12, 29, 30, 31, 32, 33, 35], "peopl": 3, "percentag": 40, "perform": [47, 48], "person": 43, "pf": 47, "pianosi": [16, 40], "pick": 4, "pip": [1, 44, 46], "pixel": [4, 6, 7, 8, 47], "plan": [44, 45], "pleas": [41, 43, 44], "plu": 10, "point": 35, "polici": [39, 43], "porcentag": [13, 14, 15], "port": 40, "posit": [5, 6, 7, 8, 10, 13, 14, 15, 34, 35, 39], "possibl": [4, 34], "potenti": [4, 12, 47], "pp": 40, "practic": [44, 45], "pranav": 5, "pranavg23": 47, "pre": 47, "predefin": 47, "prefer": 47, "prevent": 5, "previous": 47, "priorit": 43, "prob_drop": 4, "probabl": [4, 9], "problem": [4, 6, 7, 8, 9, 40, 47], "problemat": [44, 46], "proceed": [2, 39, 41, 44], "process": [41, 44], "product": 50, "project": 3, "protein": [11, 12], "provid": [3, 9, 44, 47, 49], "pseudo": 47, "public": [2, 44], "publish": 43, "pull": [43, 48], "py": [47, 48], "pydoc": 47, "pypi": 47, "pytest": 48, "python": [44, 45, 47], "q": 40, "qld": 40, "qualiti": 47, "quantiti": [13, 14, 15], "question": 3, "r": [1, 49, 50], "r_i": 34, "randint": 47, "random": 40, "rang": [47, 49], "rather": 4, "reach": [3, 6, 7, 8, 10, 11, 12, 16, 29, 30, 31, 32, 33, 35, 47], "reacher": 38, "read": 5, "readm": 47, "readthedoc": 50, "reason": 5, "rebuild": 1, "receiv": [11, 47], "recent": 49, "recov": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "red": 10, "refactor": [3, 13, 14, 15], "refer": 48, "registr": 48, "registri": 48, "reinforc": [2, 4, 9, 10, 41, 43, 44, 45, 47], "reinject": 50, "relax": [2, 41, 44], "releas": [16, 40], "reli": 47, "reliabl": [41, 43, 44], "remov": [29, 30, 31, 32], "remove_move_penalti": [29, 30, 31, 32], "renam": 47, "render": [13, 14, 15, 40, 48], "render_mod": [13, 14, 15, 40], "repeat": [13, 14, 15], "repositori": [41, 42, 44, 48], "repres": 47, "request": 43, "requir": 1, "research": [41, 43, 44], "reservoir": [3, 16, 47], "reset": [44, 45, 47, 48, 49, 50], "resourc": [12, 47], "respect": 49, "restelli": 40, "retriev": [13, 14, 15], "return": [9, 13, 14, 15, 39, 44, 47, 48, 50], "return_queu": 49, "revamp": 47, "revers": [4, 5, 29, 30, 31, 32], "reverse_penalti": 5, "reward": [5, 22, 44, 45, 47, 48, 49, 50], "reward_dim": 48, "reward_spac": [47, 48], "reymond": [3, 40], "rgb": [13, 14], "rgb_arrai": [13, 14, 15, 40], "right": [4, 6, 7, 8, 10, 11, 13, 14, 15, 21, 39], "right_lan": 16, "rightest": 16, "riva": 40, "rl": 47, "rnd": 47, "robert": 4, "rodriguez": 43, "roijer": 12, "room": [3, 12], "root": [11, 47], "run": [20, 26, 37, 48, 49], "runzheyang": 3, "safeti": 4, "same": [6, 7, 8], "sampl": [43, 49], "save": 47, "scalar": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 50], "scale": [20, 26], "scenario": 47, "scott": 47, "sea": [3, 12, 49, 50], "sebimarkgraf": 47, "second": [13, 14, 15], "section": 4, "see": [10, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 44, 45, 47, 48], "seed": [48, 49], "select": 40, "self": [47, 48], "sens": 50, "separ": [10, 17, 19, 23, 25], "serenevillagerevamp": [4, 39], "serial": 49, "server": [3, 44], "set": [17, 18, 19, 23, 24, 25, 44, 47, 48], "setup": 47, "shape": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 48, 49], "shaped_reward": 5, "should": [47, 48], "shown": 47, "side": [27, 28], "side_engine_fuel": 5, "signal": 5, "silva": [2, 41, 44], "similar": [38, 47, 49], "similarli": [5, 16], "simon": 40, "simpl": [9, 44, 45], "simpli": 3, "sin": [13, 14, 15, 34], "sinc": [48, 49, 50], "singl": [29, 30, 31, 32, 47], "size": [4, 11, 48], "skip": 50, "sky": 40, "small": [4, 47], "smooth": 50, "snippet": 47, "so": 4, "some": [3, 44, 46, 48], "soto": 43, "sourc": [6, 7, 8, 10, 12, 13, 14, 15, 33, 44], "space": [5, 12, 16, 22, 38, 47, 48], "spars": [13, 14, 15], "specif": 49, "specifi": 4, "speed": [5, 13, 14, 15, 16, 21, 29, 30, 31, 32, 47], "speed_object": 5, "spell": 47, "sphinx": 1, "split": 10, "squar": 10, "srini": 39, "stabil": 50, "stabl": [47, 50], "stable_baselines3": 50, "stai": 16, "standard": [44, 47, 50], "static": 5, "statist": 49, "stats_kei": [49, 50], "steckelmach": [3, 9], "step": [4, 5, 6, 7, 8, 9, 29, 30, 31, 32, 33, 35, 40, 43, 44, 45, 47, 48, 49], "store": 49, "str": [49, 50], "structur": 47, "sub": 49, "submarin": [6, 7, 8, 12], "submiss": 43, "subpackag": 47, "successfulli": [27, 28], "successor": [3, 10], "suit": 44, "super": 35, "supermario": [3, 16], "supermariobro": 35, "supermariobrosenv": 16, "suppli": 40, "support": 16, "swimmer": 38, "swimmerenv": 36, "system": [41, 44, 46], "t": [49, 50], "tailor": 47, "take": [4, 12], "taken": 12, "talbi": [2, 41, 44], "target": 34, "target_1": 38, "target_2": 38, "target_3": 38, "target_4": 38, "target_i": 34, "taxonomi": 43, "termin": [44, 45, 47, 48, 49], "th": 50, "than": 4, "thank": 3, "thei": [47, 49, 50], "them": [3, 4, 5, 44, 45], "therefor": 11, "thi": [1, 4, 41, 44, 45, 46, 47, 48, 49, 50], "those": 10, "thought": 47, "three": [12, 47], "threshold": 40, "thrill": 47, "through": 48, "thu": 47, "ti": 48, "time": [1, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 29, 30, 31, 32, 33, 35, 49, 50], "time_limit": 40, "time_penalti": [4, 5, 12], "timemov": 5, "timespe": 5, "timondesch": 47, "tip": 34, "titl": [2, 41, 44], "tomekst": 47, "tool": 47, "toolkit": [41, 43, 44], "top": [29, 30, 31, 32, 33], "torqu": 34, "touch": 50, "track": [49, 50], "trade": 47, "train": 50, "transfer": [3, 10], "transform": 47, "travel": 10, "treasur": [3, 4, 12, 39, 49, 50], "tree": [3, 12, 40], "triangl": 10, "true": [4, 6, 7, 8, 13, 14, 15, 40, 49], "truncat": [40, 44, 45, 47, 48, 49], "tuto": 47, "tutori": 48, "two": [9, 13, 14, 15, 16, 34, 35, 40, 50], "txt": 1, "type": [12, 13, 14, 15, 16, 47], "u": 3, "unbreakable_bottl": 4, "unbreakablebottl": 4, "under": [42, 47], "underwat": [6, 7, 8], "unpin": 47, "until": 40, "unwrap": 47, "up": [4, 6, 7, 8, 10, 39, 40], "upper": [13, 14, 15], "upstream": 40, "us": [6, 7, 8, 13, 14, 15, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "usag": 47, "user": 47, "util": [9, 47], "v0": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 21, 22, 29, 30, 31, 32, 33, 35, 38, 39, 40, 44, 45, 49, 50], "v2": [5, 47], "v3": [27, 28, 47], "v4": [17, 18, 19, 20, 23, 24, 25, 26, 34, 38, 47], "v5": [17, 19, 20, 23, 25, 26, 34, 36, 37], "valu": [4, 6, 7, 8, 11, 12, 43], "vamplew": [5, 12], "variabl": 49, "variou": [3, 42], "vecenv": 47, "vector": [10, 11, 13, 14, 15, 29, 30, 31, 32, 33, 35, 44, 47, 48, 50], "vector_reward": [44, 45, 47], "vectorenv": 49, "vectori": 47, "vehicl": 16, "veloc": [17, 18, 19, 26, 34, 36, 37, 38], "veri": [44, 45, 48], "version": [5, 10, 12, 16, 18, 21, 22, 24, 27, 28, 29, 30, 31, 32, 33, 35, 38, 47], "via": [17, 19, 23, 25, 43, 49], "vitamin": [11, 12], "wa": [3, 4, 5, 6, 7, 8, 13, 14, 15, 43, 47], "wai": [3, 10], "walker2d": 38, "walker2denv": 37, "wall": 10, "want": 3, "warn": [16, 47], "water": [3, 11, 12, 16, 47], "we": [3, 44, 47, 48], "websit": [44, 47], "weight": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 50], "welfar": 43, "well": [44, 47, 48], "were": 10, "when": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 35, 39, 47, 48], "where": [6, 7, 8, 9, 11, 29, 30, 31, 32, 33, 47], "whether": [13, 14, 15, 40], "which": [4, 5, 6, 7, 8, 9, 10, 44, 47, 48, 49, 50], "while": [4, 10, 12, 16], "within": [47, 48, 49], "without": [17, 19, 23, 25], "wood": [9, 12], "wood_amount": 12, "woodproba": 9, "work": [44, 49], "worker": 47, "workshop": [2, 43], "world": [6, 7, 8], "would": 3, "wrap": [47, 49], "wrapped_env": 49, "wrapper": [42, 44, 45, 47], "wrt": 40, "x": [6, 7, 8, 17, 18, 19, 23, 24, 25, 26, 35, 36, 37, 39], "x_po": 16, "x_veloc": [38, 47], "xu": 38, "y": [6, 7, 8, 17, 18, 19, 39], "y_veloc": 38, "yang": [6, 7, 8, 11, 12, 16], "year": [2, 41, 44], "you": [3, 41, 44, 45, 46, 47, 48], "your": [1, 41, 44], "your_ag": [44, 45, 47], "z": [23, 24, 25], "zero": [34, 47]}, "titles": ["404 - Page Not Found", "MO-Gymnasium documentation", "<no title>", "Community", "Breakable-Bottles", "Classic Control", "Deep-Sea-Treasure", "Deep-Sea-Treasure-Concave", "Deep-Sea-Treasure-Mirrored", "Fishwood", "Four-Room", "Fruit-Tree", "Grid-World", "Minecart", "Minecart-Deterministic", "Minecart-Rgb", "Miscellaneous", "MO-Ant", "MO-Ant-2D", "MO-Ant-2Obj", "MO-Halfcheetah", "MO-Highway", "MO-Highway-Fast", "MO-Hopper", "MO-Hopper-2D", "MO-Hopper-2Obj", "MO-Humanoid", "MO-Lunar-Lander", "MO-Lunar-Lander-Continuous", "MO-Mountaincar", "MO-Mountaincar-3D", "MO-Mountaincar-Timemove", "MO-Mountaincar-Timespeed", "MO-Mountaincarcontinuous", "MO-Reacher", "MO-Supermario", "MO-Swimmer", "MO-Walker2D", "MuJoCo", "Resource-Gathering", "Water-Reservoir", "Citation", "MORL Baselines", "List of Publications", "API", "API", "Install", "Release Notes", "Creating a custom environment", "Vector Wrappers", "Wrappers"], "titleterms": {"0": 47, "1": [47, 48], "2": [47, 48], "29": 47, "2d": [18, 24], "2obj": [19, 25], "3": [47, 48], "3d": 30, "4": [47, 48], "404": 0, "Not": 0, "The": 0, "acknowledg": 3, "action": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 34, 39, 40], "ant": [17, 18, 19], "api": [44, 45], "argument": [4, 6, 7, 8, 9, 10, 13, 14, 15, 40], "baselin": 42, "becom": 47, "better": 47, "bottl": [4, 47], "breakabl": [4, 47], "bug": 47, "build": 1, "citat": 41, "cite": 44, "class": 48, "classic": 5, "commun": 3, "concav": 7, "continu": 28, "control": 5, "could": 0, "creat": 48, "credit": [4, 6, 7, 8, 9, 10, 13, 14, 15, 39, 40], "custom": 48, "deep": [6, 7, 8, 47], "descript": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 39, 40], "determinist": 14, "document": [1, 47], "environ": [47, 48], "episod": [4, 6, 7, 8, 10, 11, 13, 14, 15, 35, 39], "evalu": 47, "fast": 22, "fishwood": 9, "fix": 47, "found": 0, "four": 10, "front": 47, "fruit": [11, 47], "gather": 39, "grid": 12, "gymnasium": [1, 47], "halfcheetah": 20, "highwai": [21, 22], "histori": [17, 19, 20, 23, 25, 26, 34, 36, 37], "hopper": [23, 24, 25], "humanoid": 26, "improv": 47, "instal": [44, 46], "instanti": 48, "known": 47, "lander": [27, 28], "linearreward": 50, "list": 43, "lunar": [27, 28], "matur": 47, "migrat": 47, "minecart": [13, 14, 15], "mirror": [8, 47], "miscellan": 16, "mo": [1, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47], "moclipreward": 50, "momaxandskipobserv": 50, "monormalizereward": 50, "more": 47, "morecordepisodestatist": [49, 50], "morl": 42, "mosyncvectorenv": 49, "mountaincar": [29, 30, 31, 32, 47], "mountaincarcontinu": 33, "mujoco": [38, 47], "new": [47, 48], "note": 47, "observ": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 34, 39, 40], "page": [0, 47], "pareto": 47, "polici": 47, "public": 43, "pygam": 47, "reacher": [34, 47], "refer": 10, "regist": 48, "releas": 47, "render": 47, "request": 0, "reservoir": 40, "resourc": 39, "reward": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "rgb": 15, "room": 10, "sea": [6, 7, 8, 47], "space": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "start": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 39, 40], "state": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 39, 40], "supermario": 35, "support": 47, "swimmer": 36, "termin": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 35, 39], "test": [47, 48], "timemov": 31, "timespe": 32, "treasur": [6, 7, 8, 47], "tree": [11, 47], "updat": 47, "v0": 47, "v1": 47, "vector": 49, "version": [17, 19, 20, 23, 25, 26, 34, 36, 37], "walker2d": 37, "water": 40, "webpag": 47, "world": 12, "wrapper": [49, 50], "your": 48}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.1.1": [[47, "release-0-1-1"]], "0.1.2": [[47, "release-0-1-2"]], "0.2.0": [[47, "release-0-2-0"]], "0.2.1": [[47, "release-0-2-1"]], "1. Create a new environment class": [[48, "create-a-new-environment-class"]], "2. Register the environment": [[48, "register-the-environment"]], "3. Test the environment": [[48, "test-the-environment"]], "4. Instantiate your environment": [[48, "instantiate-your-environment"]], "404 - Page Not Found": [[0, null]], "API": [[44, null], [45, null]], "Acknowledgements": [[3, "acknowledgements"]], "Action Space": [[4, "action-space"], [6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [13, "action-space"], [14, "action-space"], [15, "action-space"], [34, "action-space"], [39, "action-space"], [40, "action-space"]], "Arguments": [[4, "arguments"], [6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [13, "arguments"], [14, "arguments"], [15, "arguments"], [40, "arguments"]], "Breakable-Bottles": [[4, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Citation": [[41, null]], "Citing": [[44, "citing"]], "Classic Control": [[5, null]], "Community": [[3, null]], "Creating a custom environment": [[48, null]], "Credits": [[4, "credits"], [6, "credits"], [7, "credits"], [8, "credits"], [9, "credits"], [10, "credits"], [13, "credits"], [14, "credits"], [15, "credits"], [39, "credits"], [40, "credits"]], "Deep-Sea-Treasure": [[6, null]], "Deep-Sea-Treasure-Concave": [[7, null]], "Deep-Sea-Treasure-Mirrored": [[8, null]], "Description": [[4, "description"], [6, "description"], [7, "description"], [8, "description"], [9, "description"], [10, "description"], [11, "description"], [13, "description"], [14, "description"], [15, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [39, "description"], [40, "description"]], "Episode Termination": [[4, "episode-termination"], [6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [11, "episode-termination"], [13, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [35, "episode-termination"], [39, "episode-termination"]], "Fishwood": [[9, null]], "Four-Room": [[10, null]], "Fruit-Tree": [[11, null]], "Grid-World": [[12, null]], "Install": [[44, "install"], [46, null]], "LinearReward": [[50, "linearreward"]], "List of Publications": [[43, null]], "MO-Ant": [[17, null]], "MO-Ant-2D": [[18, null]], "MO-Ant-2Obj": [[19, null]], "MO-Gymnasium 0.3.0 Release: Migrate to Gymnasium": [[47, "release-0-3-0"]], "MO-Gymnasium 0.3.1 Release: Improved documentation and MuJoco MO-Reacher environment": [[47, "release-0-3-1"]], "MO-Gymnasium 0.3.2 Release: Bug fixes, improved webpage": [[47, "release-0-3-2"]], "MO-Gymnasium documentation": [[1, null]], "MO-Halfcheetah": [[20, null]], "MO-Highway": [[21, null]], "MO-Highway-Fast": [[22, null]], "MO-Hopper": [[23, null]], "MO-Hopper-2D": [[24, null]], "MO-Hopper-2Obj": [[25, null]], "MO-Humanoid": [[26, null]], "MO-Lunar-Lander": [[27, null]], "MO-Lunar-Lander-Continuous": [[28, null]], "MO-Mountaincar": [[29, null]], "MO-Mountaincar-3D": [[30, null]], "MO-Mountaincar-Timemove": [[31, null]], "MO-Mountaincar-Timespeed": [[32, null]], "MO-Mountaincarcontinuous": [[33, null]], "MO-Reacher": [[34, null]], "MO-Supermario": [[35, null]], "MO-Swimmer": [[36, null]], "MO-Walker2D": [[37, null]], "MOClipReward": [[50, "moclipreward"]], "MOMaxAndSkipObservation": [[50, "momaxandskipobservation"]], "MONormalizeReward": [[50, "monormalizereward"]], "MORL Baselines": [[42, null]], "MORecordEpisodeStatistics": [[49, "morecordepisodestatistics"], [50, "morecordepisodestatistics"]], "MOSyncVectorEnv": [[49, "mosyncvectorenv"]], "Minecart": [[13, null]], "Minecart-Deterministic": [[14, null]], "Minecart-Rgb": [[15, null]], "Miscellaneous": [[16, null]], "MuJoCo": [[38, null]], "Observation Space": [[4, "observation-space"], [6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [13, "observation-space"], [14, "observation-space"], [15, "observation-space"], [34, "observation-space"], [39, "observation-space"], [40, "observation-space"]], "References": [[10, "references"]], "Release Notes": [[47, null]], "Resource-Gathering": [[39, null]], "Reward Space": [[4, "reward-space"], [6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [9, "reward-space"], [10, "reward-space"], [11, "reward-space"], [13, "reward-space"], [14, "reward-space"], [15, "reward-space"], [17, "reward-space"], [18, "reward-space"], [19, "reward-space"], [20, "reward-space"], [21, "reward-space"], [23, "reward-space"], [24, "reward-space"], [25, "reward-space"], [26, "reward-space"], [27, "reward-space"], [28, "reward-space"], [34, "reward-space"], [35, "reward-space"], [36, "reward-space"], [37, "reward-space"], [39, "reward-space"], [40, "reward-space"]], "Reward space:": [[29, "reward-space"], [30, "reward-space"], [31, "reward-space"], [32, "reward-space"], [33, "reward-space"]], "Starting State": [[4, "starting-state"], [6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [13, "starting-state"], [14, "starting-state"], [15, "starting-state"], [39, "starting-state"], [40, "starting-state"]], "Termination": [[9, "termination"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Vector Wrappers": [[49, null]], "Version History": [[17, "version-history"], [19, "version-history"], [20, "version-history"], [23, "version-history"], [25, "version-history"], [37, "version-history"]], "Version History:": [[26, "version-history"], [34, "version-history"], [36, "version-history"]], "Water-Reservoir": [[40, null]], "Wrappers": [[50, null]], "v0.3.3: MO-Gymnasium 0.3.3 Release: Policy Evaluation bug fix, better documentation page": [[47, "release-v0-3-3"]], "v0.3.4: MO-Gymnasium 0.3.4 Release: Known Pareto Front, improved renders and documentation": [[47, "release-v0-3-4"]], "v1.0.0: MO-Gymnasium becomes mature": [[47, "release-v1-0-0"]], "v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more": [[47, "release-v1-0-1"]], "v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more": [[47, "release-v1-1-0"]], "v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more": [[47, "release-v1-2-0"]], "v1.3.0: MO-Gymnasium 1.3.0 Release: New Mujoco v5 Environments": [[47, "release-v1-3-0"]]}, "docnames": ["404", "README", "citing/citing", "community/community", "environments/breakable-bottles", "environments/classical", "environments/deep-sea-treasure", "environments/deep-sea-treasure-concave", "environments/deep-sea-treasure-mirrored", "environments/fishwood", "environments/four-room", "environments/fruit-tree", "environments/grid-world", "environments/minecart", "environments/minecart-deterministic", "environments/minecart-rgb", "environments/misc", "environments/mo-ant", "environments/mo-ant-2d", "environments/mo-ant-2obj", "environments/mo-halfcheetah", "environments/mo-highway", "environments/mo-highway-fast", "environments/mo-hopper", "environments/mo-hopper-2d", "environments/mo-hopper-2obj", "environments/mo-humanoid", "environments/mo-lunar-lander", "environments/mo-lunar-lander-continuous", "environments/mo-mountaincar", "environments/mo-mountaincar-3d", "environments/mo-mountaincar-timemove", "environments/mo-mountaincar-timespeed", "environments/mo-mountaincarcontinuous", "environments/mo-reacher", "environments/mo-supermario", "environments/mo-swimmer", "environments/mo-walker2d", "environments/mujoco", "environments/resource-gathering", "environments/water-reservoir", "examples/citation", "examples/morl_baselines", "examples/publications", "index", "introduction/api", "introduction/install", "release_notes", "tutorials/custom_env", "wrappers/vector_wrappers", "wrappers/wrappers"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["404.md", "README.md", "citing/citing.md", "community/community.md", "environments/breakable-bottles.md", "environments/classical.md", "environments/deep-sea-treasure.md", "environments/deep-sea-treasure-concave.md", "environments/deep-sea-treasure-mirrored.md", "environments/fishwood.md", "environments/four-room.md", "environments/fruit-tree.md", "environments/grid-world.md", "environments/minecart.md", "environments/minecart-deterministic.md", "environments/minecart-rgb.md", "environments/misc.md", "environments/mo-ant.md", "environments/mo-ant-2d.md", "environments/mo-ant-2obj.md", "environments/mo-halfcheetah.md", "environments/mo-highway.md", "environments/mo-highway-fast.md", "environments/mo-hopper.md", "environments/mo-hopper-2d.md", "environments/mo-hopper-2obj.md", "environments/mo-humanoid.md", "environments/mo-lunar-lander.md", "environments/mo-lunar-lander-continuous.md", "environments/mo-mountaincar.md", "environments/mo-mountaincar-3d.md", "environments/mo-mountaincar-timemove.md", "environments/mo-mountaincar-timespeed.md", "environments/mo-mountaincarcontinuous.md", "environments/mo-reacher.md", "environments/mo-supermario.md", "environments/mo-swimmer.md", "environments/mo-walker2d.md", "environments/mujoco.md", "environments/resource-gathering.md", "environments/water-reservoir.md", "examples/citation.md", "examples/morl_baselines.md", "examples/publications.md", "index.md", "introduction/api.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "wrappers/vector_wrappers.md", "wrappers/wrappers.md"], "indexentries": {"linearreward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.LinearReward", false]], "moclipreward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MOClipReward", false]], "momaxandskipobservation (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MOMaxAndSkipObservation", false]], "monormalizereward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MONormalizeReward", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MORecordEpisodeStatistics", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers.vector)": [[49, "mo_gymnasium.wrappers.vector.MORecordEpisodeStatistics", false]], "mosyncvectorenv (class in mo_gymnasium.wrappers.vector)": [[49, "mo_gymnasium.wrappers.vector.MOSyncVectorEnv", false]]}, "objects": {"mo_gymnasium.wrappers": [[50, 0, 1, "", "LinearReward"], [50, 0, 1, "", "MOClipReward"], [50, 0, 1, "", "MOMaxAndSkipObservation"], [50, 0, 1, "", "MONormalizeReward"], [50, 0, 1, "", "MORecordEpisodeStatistics"]], "mo_gymnasium.wrappers.vector": [[49, 0, 1, "", "MORecordEpisodeStatistics"], [49, 0, 1, "", "MOSyncVectorEnv"]]}, "objnames": {"0": ["py", "class", "Python class"]}, "objtypes": {"0": "py:class"}, "terms": {"": [4, 5, 6, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 44, 45, 47, 50], "0": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 49, 50], "01": 47, "02": 47, "03": 47, "06": 47, "07": [29, 30, 31, 32, 33], "08": [47, 50], "09": 47, "1": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 49, 50], "10": [6, 7, 8, 11, 12, 27, 28, 39, 40, 47], "100": [27, 28, 35, 47, 49, 50], "101": 47, "103": 47, "105": [17, 19, 47], "106": 47, "107": 47, "108": 47, "109": 47, "11": [6, 7, 23, 24, 25, 47], "1109": 40, "1145": 39, "12": 47, "124": [7, 8], "13": [10, 47], "1390156": 39, "1390162": 39, "14": [10, 47], "16": 47, "160": 40, "17": [20, 26, 37], "18": 47, "19": 47, "1e": [23, 25, 36, 37, 50], "2": [4, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 49], "20": [8, 47], "200": 9, "2008": [12, 39], "2010": 12, "2011": 5, "2012": 40, "2013": 16, "2017": 10, "2018": 12, "2019": [6, 7, 8, 11, 12, 13, 14, 15, 16], "2020": 38, "2021": 12, "2022": [2, 5, 12, 43, 47], "2022bnaic": 2, "2023": [41, 43, 44, 47], "2024": [43, 47], "21": 47, "23": [6, 47], "24": 47, "240": [4, 35], "25": [26, 35, 47], "255": [15, 35], "256": 35, "25th": 39, "26": 47, "27": [18, 47], "28": [27, 28, 47], "2d": [6, 7, 8, 10, 13, 14, 15, 17, 19, 23, 25, 33, 47, 49], "2obj": [17, 23, 47], "3": [4, 6, 7, 8, 10, 13, 14, 15, 17, 18, 19, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 35, 37, 39, 40, 49], "30": 47, "31": 47, "33": 47, "34": 47, "348": 26, "34th": 2, "35": 47, "360": 4, "37": 47, "37th": [41, 44], "3d": [5, 13, 14, 15, 29, 31, 32], "4": [4, 6, 7, 8, 10, 13, 14, 15, 26, 27, 28, 34, 35, 36, 39, 40, 49, 50], "40": 47, "41": [39, 47], "42": [47, 49], "43": 47, "45": 47, "46": 47, "47": [39, 47], "480": 15, "5": [4, 11, 12, 13, 14, 15, 21, 22, 27, 28, 35, 39, 47], "50": [4, 47], "51": 47, "52": 47, "53": 47, "55": 47, "56": 47, "57": 47, "58": 47, "59": 47, "6": [11, 12, 13, 14, 15, 20, 27, 28, 29, 30, 31, 32, 33, 34, 37], "60": 47, "61": 47, "62": 47, "6252759": 40, "63": 11, "64": 47, "65": 47, "67": 47, "69": 47, "7": [6, 11, 12, 13, 14, 15, 47, 49], "70": 47, "72": 47, "73": 47, "74": 47, "75": 47, "76": 47, "77": 47, "79": 47, "8": [17, 18, 19, 27, 28, 36, 40, 44, 45, 47], "80": 47, "81": 47, "83": 47, "84": 47, "85": 47, "86": 47, "87": 47, "89": 47, "9": 34, "90": 47, "91": 47, "92": 47, "93": 47, "94": 47, "95": 47, "97": 47, "99": [47, 50], "A": [2, 4, 10, 16, 17, 18, 19, 22, 23, 25, 29, 30, 31, 32, 33, 40, 41, 43, 44, 45, 50], "As": [4, 44, 45], "At": 49, "But": 50, "By": [29, 30, 31, 32, 40], "For": [1, 34, 44, 45, 47, 49], "If": [3, 13, 14, 15, 17, 18, 19, 23, 24, 25, 40, 41, 44, 48], "In": [4, 47], "It": [42, 44, 45, 47, 48], "Of": 47, "The": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 33, 34, 35, 36, 37, 39, 40, 44, 47, 48, 49], "There": 40, "To": [1, 6, 7, 8, 44, 46], "With": 47, "_": 49, "__init__": 48, "_build": 1, "_episod": 49, "_forward_reward_weight": 47, "_modul": 50, "aama": 43, "abel": [13, 14, 15, 16], "about": [1, 5], "abov": 4, "acceler": [13, 14, 15], "accept": 47, "access": [47, 49], "account": [4, 12], "achiev": 47, "act": [44, 45, 47], "action": [5, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 47, 48, 49], "action_spac": [48, 49], "acttyp": 50, "ad": [17, 18, 19, 23, 24, 25, 47, 48, 49], "adapt": [6, 7, 8, 10], "add": [29, 30, 31, 32, 43, 47], "add_speed_object": [29, 30, 31, 32], "addit": 5, "addition": 47, "after": [9, 47, 50], "again": 4, "agent": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 39, 40, 47], "ai": 4, "al": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 38, 43], "alegr": [2, 12, 41, 43, 44], "algorithm": [42, 44], "align": 43, "all": [3, 17, 18, 19, 39, 44, 46, 47, 49, 50], "allow": 47, "also": [3, 16, 44, 45, 47], "altern": [29, 30, 31, 32], "alwai": [6, 7, 8], "amount": [16, 40], "amp": 47, "an": [5, 10, 29, 30, 31, 32, 35, 39, 40, 44, 45, 47, 48, 50], "ana": [2, 41, 44], "andrea": 47, "andr\u00e9": 10, "angl": 34, "angular": 34, "ani": 49, "ann": [2, 41, 44], "ansi": 40, "ansimuz": [6, 7, 8], "ant": [38, 47], "antenv": [17, 18, 19], "api": [42, 47, 48], "appear": 2, "appli": [4, 34, 49], "approach": 4, "approxim": 43, "ar": [3, 4, 13, 14, 15, 16, 39, 40, 47, 48, 49, 50], "arm": 34, "arrai": [10, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 48, 49, 50], "art": [4, 6, 7, 8, 47], "artifici": 2, "asid": 3, "ask": 3, "asset": [4, 39, 47], "assist": [4, 6, 7, 8], "associ": 47, "atari_wrapp": 50, "attribut": 48, "australia": 40, "author": [2, 41, 44], "autobuild": 1, "automat": [1, 47, 48], "avail": [47, 49, 50], "averag": 50, "avoid": [10, 16], "axel": [13, 14, 15], "axelabel": 3, "axi": [23, 24, 25], "b": 1, "back": 47, "background": [6, 7, 8, 40], "backward": 5, "balanc": 47, "barret": 12, "barreto": 10, "barrett": 39, "base": [3, 4, 13, 14, 15, 34, 40, 43, 47, 50], "baselin": 47, "baselines3": 50, "batteri": 47, "bazzan": [2, 41, 44], "becaus": 4, "been": [4, 5, 47], "befor": 49, "begin": [49, 50], "behind": 5, "benchmark": [41, 43, 44], "benefit": 47, "benelearn": 2, "benelux": 2, "between": [35, 40, 44, 47, 50], "bib": 47, "binari": [10, 11, 12], "blob": [13, 14, 15], "blue": 10, "bnaic": [2, 43], "bnj6kubtg6": 44, "booktitl": [2, 41, 44], "bool": 49, "boolean": [4, 49], "both": 50, "both_norm_env": 50, "bottl": 12, "bottle_reward": 4, "bottles_carri": 4, "bottles_deliv": [4, 12], "bottles_drop": 4, "bound": [40, 47], "box": [6, 7, 8, 17, 18, 19, 20, 23, 24, 25, 26, 28, 33, 36, 37, 40], "brake": [13, 14, 15], "break": 47, "breakabl": 12, "breakablebottl": 4, "brisban": 40, "bro": 35, "bruno": [2, 41, 44], "budget": 43, "buffer": 49, "buffer_length": [49, 50], "bugfix": 47, "bump": 47, "button": 47, "c": [2, 41, 44], "cai": 43, "calcul": 4, "call": 47, "callabl": 49, "can": [3, 4, 9, 11, 13, 14, 15, 17, 19, 23, 25, 29, 30, 31, 32, 40, 44, 45, 46, 47, 49, 50], "cannot": 4, "capabl": 47, "capac": [13, 14, 15], "car": [5, 29, 30, 31, 32, 47], "carb": [11, 12], "care": 49, "carri": 4, "cart": [13, 14, 15], "castelletti": 40, "catch": 9, "caus": 47, "cc": 47, "cd": 1, "cell": 12, "central": 34, "certain": [44, 46], "chanc": 12, "chang": [1, 6, 7, 8, 20, 26, 29, 30, 31, 32, 47], "changelog": 47, "check": [44, 45, 47], "chose": 11, "ci": 47, "circl": 10, "citat": 47, "cite": 41, "class": [5, 44, 45, 49, 50], "classic": [6, 7, 8, 48], "clip": 50, "close": 48, "co": [13, 14, 15, 34], "code": [3, 6, 7, 8, 9, 10, 13, 14, 15, 40, 47, 50], "coin": [16, 35], "colab": [44, 45], "collect": [9, 10, 11, 12, 13, 14, 15, 16, 35, 39, 47], "collis": [16, 21], "com": [3, 13, 14, 15], "combin": 47, "commit": 47, "common": 50, "commun": [44, 47], "compar": 44, "complet": 50, "compliant": 44, "compon": [10, 47, 50], "compromis": 47, "comput": [34, 47, 48], "concav": [12, 47], "concave_map": [6, 7, 8], "conduct": 47, "confer": [2, 39, 40, 41, 44], "config": [13, 14, 15], "configur": [13, 14, 15], "conflict": 47, "conor": 3, "consequ": 47, "consist": 39, "constructor": 48, "consum": [13, 14, 15], "consumpt": [5, 13, 14, 15, 16], "contact": [17, 19, 26], "contain": [1, 4, 10, 11, 12, 13, 14, 15, 29, 30, 31, 32, 33, 34, 42], "content": 40, "context": 47, "continu": [5, 6, 7, 8, 16, 33, 38, 40, 47], "contribut": [1, 3, 4, 47], "contributor": [3, 47], "control": [6, 7, 8, 9, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "control_cost": 47, "converg": 5, "convers": 47, "convex": [6, 7, 8], "coordin": [6, 7, 8, 39, 44], "copi": 49, "corner": [13, 14, 15], "correct": 47, "correspond": [16, 29, 30, 31, 32, 40], "cost": [17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 36, 37, 40], "cost_flood": 16, "cost_object": [17, 18, 19, 23, 24, 25], "crash": [27, 28], "creat": [4, 6, 7, 8, 44, 45, 47], "creation": 47, "criteria": 39, "ctrl_cost": 47, "cumul": [49, 50], "current": [4, 6, 7, 8, 40], "custom": 47, "d": [11, 12, 43], "da": [2, 41, 44], "dall": [4, 6, 7, 8], "dam": [16, 40], "danoi": [2, 41, 44], "deal": 48, "death": 16, "decis": 40, "decomposit": 43, "deep": [3, 12, 49, 50], "deep_sea_treasur": 47, "deepseatreasur": [6, 7, 8], "default": [6, 7, 8, 13, 14, 15, 29, 30, 31, 32, 40], "deficit": 40, "deficit_wat": 16, "defin": [4, 5, 16, 34, 48], "definit": [44, 45], "deliv": [4, 12], "demand": 40, "deni": [3, 9], "dens": [13, 14, 15], "dep": 47, "depend": [44, 46], "deprec": 47, "depth": [11, 12], "deque_s": 49, "descript": [5, 12, 16, 38], "design": [47, 49], "desir": 47, "destin": 12, "detail": [5, 44, 45], "determin": 47, "determinist": 47, "develop": 44, "deviat": 50, "di": 35, "diamond": 39, "dict": 4, "dictionari": [4, 12], "did": 4, "differ": [4, 12, 47], "dim_reward": 49, "dimens": [4, 47], "dimension": [6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 39], "directli": [47, 49, 50], "directori": 48, "dirhtml": 1, "disc_episode_return": 47, "discord": [3, 44], "discount": [48, 49, 50], "discret": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 21, 22, 27, 29, 30, 31, 32, 34, 35, 38, 39, 47], "dissert": 5, "distanc": [34, 48], "distinct": 47, "distribut": 43, "do": 47, "doc": [1, 47], "document": [44, 48], "doe": [44, 46, 50], "doi": 40, "domain": 47, "done": [48, 49], "dot": 50, "down": [6, 7, 8, 10, 39], "downstream": 40, "dr": [49, 50], "drop": [4, 47], "dst": [12, 47], "dst_map": [6, 7, 8], "dtype": [47, 49], "due": [5, 40], "dynmorl": 3, "e": [1, 2, 4, 6, 7, 8, 12, 33, 41, 44, 47], "each": [4, 6, 7, 8, 11, 13, 14, 15, 29, 30, 31, 32, 33, 34, 47, 49], "eat": 12, "edit": 47, "effici": 43, "either": 9, "el": [2, 41, 44], "elaps": [49, 50], "elbow": 34, "element": [39, 47], "els": [10, 35, 39], "en": 50, "enabl": 47, "end": [9, 13, 14, 15, 49], "enemi": [4, 12, 16, 35, 39], "energi": 38, "engin": [27, 28], "entri": 43, "entry_point": 48, "env": [3, 5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 38, 44, 45, 47, 48, 49, 50], "env_fn": 49, "environ": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 43, 44, 45, 46, 49], "episod": [9, 40, 49, 50], "epsilon": 50, "equival": 5, "error": 47, "esr": [12, 47], "essenti": [44, 48], "et": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 38, 43], "eval_mo": 47, "everi": [1, 11, 12, 50], "exampl": [10, 42, 44, 45, 47, 49, 50], "except": 50, "excess": 40, "execut": [16, 40], "exhaust": 47, "expand": 47, "expect": 9, "extend": 47, "extra": [5, 29, 30, 31, 32], "extract": 50, "ezpickl": 47, "f": [3, 40], "fair": 43, "fall": 47, "fals": [17, 18, 19, 23, 24, 25, 49], "famili": [44, 46], "fan": 43, "fantasi": [6, 7, 8], "far": 35, "farama": [3, 13, 14, 15, 17, 19, 20, 23, 25, 26, 34, 36, 37, 44, 47], "fast": [16, 47], "fat": [11, 12], "featur": [3, 10, 47], "feder": 43, "felten": [2, 12, 41, 43, 44], "felten_toolkit_2023": [41, 44], "few": [47, 49, 50], "ffelten": 47, "file": [13, 14, 15, 47, 48], "fill": [13, 14, 15], "finger_tip_coord": 34, "fire": 12, "first": [2, 13, 14, 15, 40, 43, 47, 49], "fish": [9, 12], "fish_amount": 12, "fisherman": 9, "fishproba": 9, "fishwood": [3, 12, 47], "fit": 40, "fix": 10, "flag": [4, 17, 18, 19, 23, 24, 25, 35, 39, 48], "flexibl": 47, "float": [40, 48, 49, 50], "float32": [17, 18, 19, 20, 23, 24, 25, 26, 28, 33, 36, 37, 40, 49], "float_stat": [6, 7, 8], "flood": 40, "florian": [2, 41, 44], "folder": [1, 47], "follow": [2, 10, 13, 14, 15, 17, 18, 19, 20, 23, 24, 25, 26, 29, 30, 31, 32, 36, 37, 44, 45, 47, 48], "forc": [17, 19, 26], "forgotten": 47, "fork": 1, "form": 49, "formerli": [2, 43], "forward": [5, 20, 23, 24, 25, 26, 29, 30, 31, 32, 36, 37], "forward_penalti": 5, "forward_reward": 47, "found": 47, "foundat": [13, 14, 15, 47], "four": [3, 12, 34], "frame": 50, "frame_skip": [13, 14, 15], "frameskip": 50, "framework": 43, "from": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 26, 39, 40, 47, 48, 49, 50], "front": 48, "fruit": [3, 12], "fruit_tre": 47, "fuel": [5, 13, 14, 15, 16, 27, 28, 33], "fuel_consumption_penalti": 5, "full": [11, 12, 47], "function": [44, 45, 47], "g": [10, 12, 47], "gamma": [48, 49, 50], "gather": [12, 47], "gem": [4, 12, 39], "gener": [43, 47, 48], "get": 47, "gg": 44, "ghazali": [2, 41, 44], "gif": 47, "gimelfarb": [3, 10], "github": [3, 13, 14, 15, 47], "give": 5, "given": 50, "go": [1, 9, 11, 23, 24, 25, 29, 30, 31, 32], "goal": [10, 12, 29, 30, 31, 32, 33], "goe": 48, "goir": [2, 41, 44], "gold": [4, 12, 39], "gr": [2, 41, 44], "green": 10, "grid": [6, 7, 8], "gridworld": [10, 12], "ground": 4, "group": 47, "gt": 47, "guarante": 43, "guid": [44, 45], "gupta": 5, "gym": [2, 35, 43, 44, 45, 47], "gymnasium": [2, 5, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 42, 43, 44, 45, 46, 48, 49, 50], "ha": [4, 5, 17, 19, 20, 23, 25, 26, 35, 47, 49], "half_cheetah": 20, "halfcheetah": [38, 47], "halfcheetahenv": 20, "harder": 12, "hartmann": 43, "have": [3, 4, 5, 12, 44, 47, 50], "hay": 3, "healthi": [17, 18, 19], "heavili": 50, "height": 38, "help": 3, "here": [3, 10, 44, 45, 47], "high": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 47], "higher": 47, "highwai": [16, 47], "highwayenv": 21, "highwayfastenv": 22, "home": [4, 39], "hopper": [38, 47], "hopperenv": [23, 24, 25], "hotfix": 47, "how": [1, 13, 14, 15, 35, 42, 47], "html": 50, "http": [3, 4, 6, 7, 8, 13, 14, 15, 17, 19, 20, 23, 25, 26, 34, 36, 37, 39, 40, 44, 50], "human": [13, 14, 15, 40], "humanoid": [38, 47], "humanoidenv": 26, "humonoid": 38, "hung": 5, "hydroelectr": 40, "hyperparamet": 43, "i": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 42, 44, 45, 47, 48, 49, 50], "ianleongudri": 47, "id": [17, 19, 23, 25, 48], "idx": 50, "igd": 48, "ijcnn": 40, "illustr": 47, "imag": [13, 14, 15, 16, 40], "image_observ": [13, 14, 15], "impact": 4, "implement": [4, 42, 48], "import": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "improv": 43, "includ": [16, 17, 19, 26, 44, 46], "inconsist": 47, "increment": [13, 14, 15], "incremental_frame_skip": [13, 14, 15], "index": [49, 50], "indic": [4, 10, 39, 47, 49], "inf": [4, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 40], "info": [44, 45, 47, 48, 49, 50], "info_dict": 47, "inform": [1, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 41, 44], "inher": 47, "inherit": 48, "init": 47, "initi": [40, 48], "initial_st": 40, "inproceed": [2, 41, 44], "inspir": 50, "instal": 1, "instanc": [44, 45, 47], "instanti": [17, 19, 23, 25], "instead": [4, 17, 19, 23, 25, 47], "int": [49, 50], "int32": 49, "integ": 48, "integr": 47, "intellig": 2, "interact": [44, 45], "intern": [39, 40], "introduc": [5, 10, 47], "invert": 48, "io": [4, 6, 7, 8, 39, 50], "issu": 47, "itch": [4, 6, 7, 8, 39], "item": [10, 12], "item1": 12, "item2": 12, "item3": 12, "iter": [40, 49], "its": 48, "ivanov": 43, "j": 47, "johnson": 47, "join": [3, 44], "joint": [34, 40], "json": [13, 14, 15], "jump": [23, 24, 25], "kallinteri": 47, "katze2664": 47, "keep": [49, 50], "kei": [4, 49], "kill": [12, 35, 39], "klassert": 4, "known": 48, "kwarg": 48, "l": [2, 41, 44, 49, 50], "lack": 5, "lambda": 49, "land": [5, 27, 28], "lander": [5, 47], "lane": [16, 21], "larger": 4, "last": [49, 50], "leaf": [11, 12], "learn": [2, 4, 9, 10, 39, 41, 43, 44, 45, 47], "left": [4, 6, 7, 8, 10, 11, 13, 14, 15, 39], "length": [49, 50], "length_queu": 49, "leon": 39, "level": [40, 47], "leverag": 43, "librari": [2, 43, 44, 47], "life": 47, "light": 12, "like": [3, 44, 46, 50], "limezu": [4, 39], "limit": 16, "line": 48, "linear": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "linearli": 47, "linearreward": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "linearwrapp": 47, "link": 47, "lint": 47, "list": [4, 47], "literatur": 47, "local": 5, "locat": [4, 12, 34], "logo": 47, "look": 50, "low": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "lower": 10, "luca": [2, 41, 44], "lucasalegr": 47, "lunar": [5, 47], "lunarland": [5, 27, 28], "m": 40, "machin": 39, "made": [1, 47], "mai": 47, "main": [3, 13, 14, 15, 27, 28, 36, 37], "main_engine_fuel": 5, "make": [1, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "mani": [13, 14, 15, 49], "map": [6, 7, 8, 10, 12, 13, 14, 15, 47], "mario": [35, 47], "mark": 47, "markov": 40, "master": 50, "match": 47, "mathieu": [3, 40], "max": 50, "max_r": 50, "max_t": 9, "maxandskipenv": 50, "maxima": 5, "maximum": 40, "maze": 10, "md": [1, 47], "mdp": [44, 45, 47], "mean": 50, "merg": [5, 29, 30, 31, 32], "merge_move_penalti": [29, 30, 31, 32], "method": [47, 48], "metric": 48, "mgoulao": 47, "mike": [3, 10], "min": 50, "min_r": 50, "mine": [13, 14, 15], "mine_config": [13, 14, 15], "minecart": [3, 16, 44, 45, 47], "miner": [11, 12], "minerium": [13, 14, 15], "minim": [13, 14, 15, 16], "minor": 47, "mirror": 12, "mirrored_map": [6, 7, 8], "miss": [43, 47], "mistak": 47, "mo": [2, 3, 5, 13, 14, 15, 16, 38, 42, 43, 44, 45, 46, 48, 49, 50], "mo_gym": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 49, 50], "mo_gymnasium": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "mode": [13, 14, 15, 40], "model": [43, 44, 45], "modem": 43, "modifi": 47, "modul": [49, 50], "mofl": 43, "momaxandskipobserv": 47, "momdp": [44, 45, 47], "monormalizereward": 47, "more": [1, 5, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 44, 45], "morecordepisodestatist": 47, "moreov": [48, 49], "morewordstatist": 49, "morl": [3, 6, 7, 8, 9, 44, 45, 47], "most": 49, "mountain": [5, 29, 30, 31, 32, 33, 47], "mountaincar": [5, 33], "mountaincarcontinu": [5, 47], "move": [4, 5, 35, 36, 39, 47, 50], "move_penalti": 5, "much": 35, "mujoco": [17, 19, 20, 23, 25, 26, 34, 36, 37, 44, 46], "multi": [2, 5, 9, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 40, 41, 43, 44, 45, 47, 48], "multibinari": 4, "multiobject": 4, "multipl": [4, 39, 42, 43, 47, 48, 49], "must": [12, 13, 14, 15, 16, 48], "my_env_dir": 48, "my_env_fil": 48, "my_env_v0": 48, "myenv": 48, "mypi": 47, "n": [2, 41, 44], "nO": 40, "narayanan": [12, 39], "ndarrai": 50, "need": 47, "neg": [10, 33, 34], "neighbour": 16, "network": 40, "neural": [40, 41, 44], "neurip": [41, 43, 44], "next": 48, "next_ob": [44, 45, 47], "ninjikin": [4, 39], "nip": 10, "node": 11, "none": [13, 14, 15, 40, 47, 50], "norm": 33, "norm_treasure_env": 50, "normal": [40, 47, 49, 50], "normalized_act": 40, "note": [4, 50], "notebook": [44, 45], "now": [2, 17, 19, 23, 25, 26, 41, 44, 47], "np": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "num": 49, "num_env": 49, "number": [4, 40], "numpi": [44, 45, 47, 48], "nutri1": 12, "nutri6": 12, "nutrient": [11, 12], "ob": [5, 12, 16, 38, 44, 45, 47, 49], "object": [2, 5, 9, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 40, 41, 43, 44, 45, 47, 48], "observ": [12, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 47, 48, 50], "observation_spac": 48, "observationspac": 47, "obstyp": 50, "off": 47, "oject": 48, "onc": 1, "one": [44, 46, 47, 50], "onli": [40, 50], "open": [43, 44], "opengameart": 40, "optim": [39, 43, 47], "option": [29, 30, 31, 32, 44, 45, 47, 48], "order": 47, "ore1": 16, "ore2": 16, "ores": [13, 14, 15, 16], "org": [17, 19, 20, 23, 25, 26, 34, 36, 37, 40, 44], "orient": [13, 14, 15], "origin": [4, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "other": [16, 17, 18, 19, 20, 23, 24, 25, 44, 45, 47, 50], "otherwis": [4, 9, 35], "our": [1, 47, 48], "out": [3, 40], "outcom": 4, "output": 49, "packag": [1, 47], "paper": 4, "pareto": [43, 48], "pareto_front": [47, 48], "parisi": 40, "part": [47, 48], "pass": [35, 47], "passag": 10, "path": [13, 14, 15], "paulina": 40, "penal": 40, "penalti": [4, 5, 6, 7, 8, 12, 29, 30, 31, 32, 33, 35], "peopl": 3, "percentag": 40, "perform": [47, 48], "person": 43, "pf": 47, "pianosi": [16, 40], "pick": 4, "pip": [1, 44, 46], "pixel": [4, 6, 7, 8, 47], "plan": [44, 45], "pleas": [41, 43, 44], "plu": 10, "point": 35, "polici": [39, 43], "porcentag": [13, 14, 15], "port": 40, "posit": [5, 6, 7, 8, 10, 13, 14, 15, 34, 35, 39], "possibl": [4, 34], "potenti": [4, 12, 47], "pp": 40, "practic": [44, 45], "pranav": 5, "pranavg23": 47, "pre": 47, "predefin": 47, "prefer": 47, "prevent": 5, "previous": 47, "priorit": 43, "prob_drop": 4, "probabl": [4, 9], "problem": [4, 6, 7, 8, 9, 40, 47], "problemat": [44, 46], "proceed": [2, 39, 41, 44], "process": [41, 44], "product": 50, "project": 3, "protein": [11, 12], "provid": [3, 9, 44, 47, 49], "pseudo": 47, "public": [2, 44], "publish": 43, "pull": [43, 48], "py": [47, 48], "pydoc": 47, "pymoo": 47, "pypi": 47, "pytest": 48, "python": [44, 45, 47], "q": 40, "qld": 40, "qualiti": 47, "quantiti": [13, 14, 15], "question": 3, "r": [1, 49, 50], "r_i": 34, "randint": 47, "random": 40, "rang": [47, 49], "rather": 4, "reach": [3, 6, 7, 8, 10, 11, 12, 16, 29, 30, 31, 32, 33, 35, 47], "reacher": 38, "read": 5, "readm": 47, "readthedoc": 50, "reason": 5, "rebuild": 1, "receiv": [11, 47], "recent": 49, "recov": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "red": 10, "refactor": [3, 13, 14, 15], "refer": 48, "registr": 48, "registri": 48, "reinforc": [2, 4, 9, 10, 41, 43, 44, 45, 47], "reinject": 50, "relax": [2, 41, 44], "releas": [16, 40], "reli": 47, "reliabl": [41, 43, 44], "remov": [29, 30, 31, 32, 47], "remove_move_penalti": [29, 30, 31, 32], "renam": 47, "render": [13, 14, 15, 40, 48], "render_mod": [13, 14, 15, 40], "repeat": [13, 14, 15], "repositori": [41, 42, 44, 48], "repres": 47, "request": 43, "requir": 1, "research": [41, 43, 44], "reservoir": [3, 16, 47], "reset": [44, 45, 47, 48, 49, 50], "resourc": [12, 47], "respect": 49, "restelli": 40, "retriev": [13, 14, 15], "return": [9, 13, 14, 15, 39, 44, 47, 48, 50], "return_queu": 49, "revamp": 47, "revers": [4, 5, 29, 30, 31, 32], "reverse_penalti": 5, "reward": [5, 22, 44, 45, 47, 48, 49, 50], "reward_dim": 48, "reward_spac": [47, 48], "reymond": [3, 40], "rgb": [13, 14], "rgb_arrai": [13, 14, 15, 40], "right": [4, 6, 7, 8, 10, 11, 13, 14, 15, 21, 39], "right_lan": 16, "rightest": 16, "riva": 40, "rl": 47, "rnd": 47, "robert": 4, "rodriguez": 43, "roijer": 12, "room": [3, 12], "root": [11, 47], "run": [20, 26, 37, 48, 49], "runzheyang": 3, "safeti": 4, "same": [6, 7, 8], "sampl": [43, 49], "save": 47, "scalar": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 50], "scale": [20, 26], "scenario": 47, "scott": 47, "sea": [3, 12, 49, 50], "sebimarkgraf": 47, "second": [13, 14, 15], "section": 4, "see": [10, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 44, 45, 47, 48], "seed": [48, 49], "select": 40, "self": [47, 48], "sens": 50, "separ": [10, 17, 19, 23, 25], "serenevillagerevamp": [4, 39], "serial": 49, "server": [3, 44], "set": [17, 18, 19, 23, 24, 25, 44, 47, 48], "setup": 47, "shape": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 48, 49], "shaped_reward": 5, "should": [47, 48], "shown": 47, "side": [27, 28], "side_engine_fuel": 5, "signal": 5, "silva": [2, 41, 44], "similar": [38, 47, 49], "similarli": [5, 16], "simon": 40, "simpl": [9, 44, 45], "simpli": 3, "sin": [13, 14, 15, 34], "sinc": [48, 49, 50], "singl": [29, 30, 31, 32, 47], "size": [4, 11, 48], "skip": 50, "sky": 40, "small": [4, 47], "smooth": 50, "snippet": 47, "so": 4, "some": [3, 44, 46, 48], "soto": 43, "sourc": [6, 7, 8, 10, 12, 13, 14, 15, 33, 44], "space": [5, 12, 16, 22, 38, 47, 48], "spars": [13, 14, 15], "specif": 49, "specifi": 4, "speed": [5, 13, 14, 15, 16, 21, 29, 30, 31, 32, 47], "speed_object": 5, "spell": 47, "sphinx": 1, "split": 10, "squar": 10, "srini": 39, "stabil": 50, "stabl": [47, 50], "stable_baselines3": 50, "stai": 16, "standard": [44, 47, 50], "static": 5, "statist": 49, "stats_kei": [49, 50], "steckelmach": [3, 9], "step": [4, 5, 6, 7, 8, 9, 29, 30, 31, 32, 33, 35, 40, 43, 44, 45, 47, 48, 49], "store": 49, "str": [49, 50], "structur": 47, "sub": 49, "submarin": [6, 7, 8, 12], "submiss": 43, "subpackag": 47, "successfulli": [27, 28], "successor": [3, 10], "suit": 44, "super": 35, "supermario": [3, 16], "supermariobro": 35, "supermariobrosenv": 16, "suppli": 40, "support": 16, "swimmer": [38, 47], "swimmerenv": 36, "system": [41, 44, 46], "t": [49, 50], "tailor": 47, "take": [4, 12], "taken": 12, "talbi": [2, 41, 44], "target": 34, "target_1": 38, "target_2": 38, "target_3": 38, "target_4": 38, "target_i": 34, "taxonomi": 43, "termin": [44, 45, 47, 48, 49], "th": 50, "than": 4, "thank": 3, "thei": [47, 49, 50], "them": [3, 4, 5, 44, 45], "therefor": 11, "thi": [1, 4, 41, 44, 45, 46, 47, 48, 49, 50], "those": 10, "thought": 47, "three": [12, 47], "threshold": 40, "thrill": 47, "through": 48, "thu": 47, "ti": 48, "time": [1, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 29, 30, 31, 32, 33, 35, 49, 50], "time_limit": 40, "time_penalti": [4, 5, 12], "timemov": 5, "timespe": 5, "timondesch": 47, "tip": 34, "titl": [2, 41, 44], "tomekst": 47, "tool": 47, "toolkit": [41, 43, 44], "top": [29, 30, 31, 32, 33], "torqu": 34, "touch": 50, "track": [49, 50], "trade": 47, "train": 50, "transfer": [3, 10], "transform": 47, "travel": 10, "treasur": [3, 4, 12, 39, 49, 50], "tree": [3, 12, 40], "triangl": 10, "true": [4, 6, 7, 8, 13, 14, 15, 40, 49], "truncat": [40, 44, 45, 47, 48, 49], "tuto": 47, "tutori": 48, "two": [9, 13, 14, 15, 16, 34, 35, 40, 50], "txt": 1, "type": [12, 13, 14, 15, 16, 47], "u": 3, "unbreakable_bottl": 4, "unbreakablebottl": 4, "under": [42, 47], "underwat": [6, 7, 8], "unpin": 47, "until": 40, "unwrap": 47, "up": [4, 6, 7, 8, 10, 39, 40], "upper": [13, 14, 15], "upstream": 40, "us": [6, 7, 8, 13, 14, 15, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "usag": 47, "user": 47, "util": [9, 47], "v0": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 21, 22, 29, 30, 31, 32, 33, 35, 39, 40, 44, 45, 49, 50], "v2": [5, 47], "v3": [27, 28, 47], "v4": [17, 18, 19, 20, 23, 24, 25, 26, 34, 47], "v5": [17, 19, 20, 23, 25, 26, 34, 36, 37, 38], "valu": [4, 6, 7, 8, 11, 12, 43], "vamplew": [5, 12], "variabl": 49, "variou": [3, 42], "vecenv": 47, "vector": [10, 11, 13, 14, 15, 29, 30, 31, 32, 33, 35, 44, 47, 48, 50], "vector_reward": [44, 45, 47], "vectorenv": 49, "vectori": 47, "vehicl": 16, "veloc": [17, 18, 19, 26, 34, 36, 37, 38], "veri": [44, 45, 48], "version": [5, 10, 12, 16, 18, 21, 22, 24, 27, 28, 29, 30, 31, 32, 33, 35, 38, 47], "via": [17, 19, 23, 25, 43, 49], "vitamin": [11, 12], "wa": [3, 4, 5, 6, 7, 8, 13, 14, 15, 43, 47], "wai": [3, 10], "walker2d": [38, 47], "walker2denv": 37, "wall": 10, "want": 3, "warn": [16, 47], "water": [3, 11, 12, 16, 47], "we": [3, 44, 47, 48], "websit": [44, 47], "weight": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 50], "welfar": 43, "well": [44, 47, 48], "were": 10, "what": 47, "when": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 35, 39, 47, 48], "where": [6, 7, 8, 9, 11, 29, 30, 31, 32, 33, 47], "whether": [13, 14, 15, 40], "which": [4, 5, 6, 7, 8, 9, 10, 44, 47, 48, 49, 50], "while": [4, 10, 12, 16], "within": [47, 48, 49], "without": [17, 19, 23, 25], "wood": [9, 12], "wood_amount": 12, "woodproba": 9, "work": [44, 49], "worker": 47, "workshop": [2, 43], "world": [6, 7, 8], "would": 3, "wrap": [47, 49], "wrapped_env": 49, "wrapper": [42, 44, 45, 47], "wrt": 40, "x": [6, 7, 8, 17, 18, 19, 23, 24, 25, 26, 35, 36, 37, 39], "x_po": 16, "x_veloc": [38, 47], "xu": 38, "y": [6, 7, 8, 17, 18, 19, 39], "y_veloc": 38, "yang": [6, 7, 8, 11, 12, 16], "year": [2, 41, 44], "you": [3, 41, 44, 45, 46, 47, 48], "your": [1, 41, 44], "your_ag": [44, 45, 47], "z": [23, 24, 25], "zero": [34, 47]}, "titles": ["404 - Page Not Found", "MO-Gymnasium documentation", "<no title>", "Community", "Breakable-Bottles", "Classic Control", "Deep-Sea-Treasure", "Deep-Sea-Treasure-Concave", "Deep-Sea-Treasure-Mirrored", "Fishwood", "Four-Room", "Fruit-Tree", "Grid-World", "Minecart", "Minecart-Deterministic", "Minecart-Rgb", "Miscellaneous", "MO-Ant", "MO-Ant-2D", "MO-Ant-2Obj", "MO-Halfcheetah", "MO-Highway", "MO-Highway-Fast", "MO-Hopper", "MO-Hopper-2D", "MO-Hopper-2Obj", "MO-Humanoid", "MO-Lunar-Lander", "MO-Lunar-Lander-Continuous", "MO-Mountaincar", "MO-Mountaincar-3D", "MO-Mountaincar-Timemove", "MO-Mountaincar-Timespeed", "MO-Mountaincarcontinuous", "MO-Reacher", "MO-Supermario", "MO-Swimmer", "MO-Walker2D", "MuJoCo", "Resource-Gathering", "Water-Reservoir", "Citation", "MORL Baselines", "List of Publications", "API", "API", "Install", "Release Notes", "Creating a custom environment", "Vector Wrappers", "Wrappers"], "titleterms": {"0": 47, "1": [47, 48], "2": [47, 48], "29": 47, "2d": [18, 24], "2obj": [19, 25], "3": [47, 48], "3d": 30, "4": [47, 48], "404": 0, "Not": 0, "The": 0, "acknowledg": 3, "action": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 34, 39, 40], "ant": [17, 18, 19], "api": [44, 45], "argument": [4, 6, 7, 8, 9, 10, 13, 14, 15, 40], "baselin": 42, "becom": 47, "better": 47, "bottl": [4, 47], "breakabl": [4, 47], "bug": 47, "build": 1, "citat": 41, "cite": 44, "class": 48, "classic": 5, "commun": 3, "concav": 7, "continu": 28, "control": 5, "could": 0, "creat": 48, "credit": [4, 6, 7, 8, 9, 10, 13, 14, 15, 39, 40], "custom": 48, "deep": [6, 7, 8, 47], "descript": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 39, 40], "determinist": 14, "document": [1, 47], "environ": [47, 48], "episod": [4, 6, 7, 8, 10, 11, 13, 14, 15, 35, 39], "evalu": 47, "fast": 22, "fishwood": 9, "fix": 47, "found": 0, "four": 10, "front": 47, "fruit": [11, 47], "gather": 39, "grid": 12, "gymnasium": [1, 47], "halfcheetah": 20, "highwai": [21, 22], "histori": [17, 19, 20, 23, 25, 26, 34, 36, 37], "hopper": [23, 24, 25], "humanoid": 26, "improv": 47, "instal": [44, 46], "instanti": 48, "known": 47, "lander": [27, 28], "linearreward": 50, "list": 43, "lunar": [27, 28], "matur": 47, "migrat": 47, "minecart": [13, 14, 15], "mirror": [8, 47], "miscellan": 16, "mo": [1, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47], "moclipreward": 50, "momaxandskipobserv": 50, "monormalizereward": 50, "more": 47, "morecordepisodestatist": [49, 50], "morl": 42, "mosyncvectorenv": 49, "mountaincar": [29, 30, 31, 32, 47], "mountaincarcontinu": 33, "mujoco": [38, 47], "new": [47, 48], "note": 47, "observ": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 34, 39, 40], "page": [0, 47], "pareto": 47, "polici": 47, "public": 43, "pygam": 47, "reacher": [34, 47], "refer": 10, "regist": 48, "releas": 47, "render": 47, "request": 0, "reservoir": 40, "resourc": 39, "reward": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "rgb": 15, "room": 10, "sea": [6, 7, 8, 47], "space": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "start": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 39, 40], "state": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 39, 40], "supermario": 35, "support": 47, "swimmer": 36, "termin": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 35, 39], "test": [47, 48], "timemov": 31, "timespe": 32, "treasur": [6, 7, 8, 47], "tree": [11, 47], "updat": 47, "v0": 47, "v1": 47, "v5": 47, "vector": 49, "version": [17, 19, 20, 23, 25, 26, 34, 36, 37], "walker2d": 37, "water": 40, "webpag": 47, "world": 12, "wrapper": [49, 50], "your": 48}}) \ No newline at end of file