From de47aa3391faa047df88ebe3d7c2c821f6b12c14 Mon Sep 17 00:00:00 2001 From: LucasAlegre Date: Tue, 15 Oct 2024 19:57:51 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/MO-Gymnasium@7c471866b70e78a5ffed83ce1562548f5ca90914?= =?UTF-8?q?=20=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- main/.buildinfo | 2 +- main/404.html | 4 +- main/README/index.html | 4 +- main/_static/documentation_options.js | 2 +- main/_static/versioning/versioning_menu.html | 21 +- main/citing/citing/index.html | 4 +- main/community/community/index.html | 4 +- .../environments/breakable-bottles/index.html | 4 +- main/environments/classical/index.html | 4 +- .../deep-sea-treasure-concave/index.html | 4 +- .../deep-sea-treasure-mirrored/index.html | 4 +- .../environments/deep-sea-treasure/index.html | 4 +- main/environments/fishwood/index.html | 4 +- main/environments/four-room/index.html | 4 +- main/environments/fruit-tree/index.html | 4 +- main/environments/grid-world/index.html | 4 +- .../minecart-deterministic/index.html | 4 +- main/environments/minecart-rgb/index.html | 4 +- main/environments/minecart/index.html | 4 +- main/environments/misc/index.html | 4 +- main/environments/mo-ant-2d/index.html | 4 +- main/environments/mo-ant/index.html | 10 +- main/environments/mo-halfcheetah/index.html | 4 +- main/environments/mo-highway-fast/index.html | 4 +- main/environments/mo-highway/index.html | 4 +- main/environments/mo-hopper-2d/index.html | 4 +- main/environments/mo-hopper/index.html | 4 +- main/environments/mo-humanoid/index.html | 10 +- .../mo-lunar-lander-continuous/index.html | 10 +- main/environments/mo-lunar-lander/index.html | 10 +- .../environments/mo-mountaincar-3d/index.html | 4 +- .../mo-mountaincar-timemove/index.html | 4 +- .../mo-mountaincar-timespeed/index.html | 4 +- main/environments/mo-mountaincar/index.html | 4 +- .../mo-mountaincarcontinuous/index.html | 4 +- 
main/environments/mo-reacher/index.html | 6 +- main/environments/mo-supermario/index.html | 4 +- main/environments/mo-swimmer/index.html | 22 +- main/environments/mo-walker2d/index.html | 4 +- main/environments/mujoco/index.html | 4 +- .../resource-gathering/index.html | 4 +- main/environments/water-reservoir/index.html | 4 +- main/examples/citation/index.html | 4 +- main/examples/morl_baselines/index.html | 10 +- main/examples/publications/index.html | 4 +- main/genindex/index.html | 20 +- main/index.html | 6 +- main/introduction/api/index.html | 6 +- main/introduction/install/index.html | 4 +- main/objects.inv | Bin 1432 -> 1521 bytes main/release_notes/index.html | 6 +- main/search/index.html | 4 +- main/searchindex.js | 2 +- main/tutorials/custom_env/index.html | 4 +- main/wrappers/vector_wrappers/index.html | 713 ++++++++++++++++++ main/wrappers/wrappers/index.html | 90 ++- 56 files changed, 961 insertions(+), 137 deletions(-) create mode 100644 main/wrappers/vector_wrappers/index.html diff --git a/main/.buildinfo b/main/.buildinfo index d1c8f84c..b4768c37 100644 --- a/main/.buildinfo +++ b/main/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 2612d33d1ddf2aea2ec6d1750c22baa3 +config: 8bb6dd5cc12145c199e1c822213cb7e5 tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/main/404.html b/main/404.html index bd608205..a34feb5b 100644 --- a/main/404.html +++ b/main/404.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -417,7 +419,7 @@

    The requested page could not be found. + diff --git a/main/README/index.html b/main/README/index.html index 1a0b019b..7fb6c104 100644 --- a/main/README/index.html +++ b/main/README/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -434,7 +436,7 @@

    Build the Documentation + diff --git a/main/_static/documentation_options.js b/main/_static/documentation_options.js index 6fe7b331..59816731 100644 --- a/main/_static/documentation_options.js +++ b/main/_static/documentation_options.js @@ -1,5 +1,5 @@ const DOCUMENTATION_OPTIONS = { - VERSION: '1.1.0', + VERSION: '1.2.0', LANGUAGE: 'en', COLLAPSE_INDEX: false, BUILDER: 'dirhtml', diff --git a/main/_static/versioning/versioning_menu.html b/main/_static/versioning/versioning_menu.html index 7a20036b..68109cf8 100644 --- a/main/_static/versioning/versioning_menu.html +++ b/main/_static/versioning/versioning_menu.html @@ -122,15 +122,18 @@ }); const sortVersions = (a, b) => { - const normVersionNames = (a) => { - return a.replace("v", "").split(""); - }; - const innerA = normVersionNames(a); - const innerB = normVersionNames(b); - - while (innerA.length && innerB.length) { - const charA = innerA.shift(); - const charB = innerB.shift(); + const innerA = a.replace("v", ""); + const innerB = b.replace("v", ""); + + if (innerA.match(/[a-z]/) && !innerB.match(/[a-z]/)) return 1; + if (!innerA.match(/[a-z]/) && innerB.match(/[a-z]/)) return -1; + + const splittedInnerA = innerA.split(""); + const splittedInnerB = innerB.split(""); + + while (splittedInnerA.length && splittedInnerB.length) { + const charA = splittedInnerA.shift(); + const charB = splittedInnerB.shift(); if (charA === charB) continue; else if (charA === ".") return 1; diff --git a/main/citing/citing/index.html b/main/citing/citing/index.html index 4f697fff..587905c2 100644 --- a/main/citing/citing/index.html +++ b/main/citing/citing/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -403,7 +405,7 @@ - + diff --git a/main/community/community/index.html b/main/community/community/index.html index 1b796669..c1a5ea80 100644 --- a/main/community/community/index.html +++ b/main/community/community/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -448,7 +450,7 @@

    Acknowledgements + diff --git a/main/environments/breakable-bottles/index.html b/main/environments/breakable-bottles/index.html index 906af64d..d65bffb3 100644 --- a/main/environments/breakable-bottles/index.html +++ b/main/environments/breakable-bottles/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -517,7 +519,7 @@

    Credits¶ - + diff --git a/main/environments/classical/index.html b/main/environments/classical/index.html index 977bf31a..0cf2ce88 100644 --- a/main/environments/classical/index.html +++ b/main/environments/classical/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -466,7 +468,7 @@

    Classic Control + diff --git a/main/environments/deep-sea-treasure-concave/index.html b/main/environments/deep-sea-treasure-concave/index.html index f3be3fbc..b9dc38bd 100644 --- a/main/environments/deep-sea-treasure-concave/index.html +++ b/main/environments/deep-sea-treasure-concave/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -520,7 +522,7 @@

    Credits¶ - + diff --git a/main/environments/deep-sea-treasure-mirrored/index.html b/main/environments/deep-sea-treasure-mirrored/index.html index 5b4c9bc0..4ff35b44 100644 --- a/main/environments/deep-sea-treasure-mirrored/index.html +++ b/main/environments/deep-sea-treasure-mirrored/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -510,7 +512,7 @@

    Credits¶ - + diff --git a/main/environments/deep-sea-treasure/index.html b/main/environments/deep-sea-treasure/index.html index ebc2dbea..37335e52 100644 --- a/main/environments/deep-sea-treasure/index.html +++ b/main/environments/deep-sea-treasure/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -508,7 +510,7 @@

    Credits¶ - + diff --git a/main/environments/fishwood/index.html b/main/environments/fishwood/index.html index 3cfe8994..389cffcf 100644 --- a/main/environments/fishwood/index.html +++ b/main/environments/fishwood/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -505,7 +507,7 @@

    Credits¶ - + diff --git a/main/environments/four-room/index.html b/main/environments/four-room/index.html index 876827dd..19e87389 100644 --- a/main/environments/four-room/index.html +++ b/main/environments/four-room/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -507,7 +509,7 @@

    Credits¶ - + diff --git a/main/environments/fruit-tree/index.html b/main/environments/fruit-tree/index.html index 47f1bad9..413e6361 100644 --- a/main/environments/fruit-tree/index.html +++ b/main/environments/fruit-tree/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -484,7 +486,7 @@

    Episode Termination + diff --git a/main/environments/grid-world/index.html b/main/environments/grid-world/index.html index e8e395fa..4a1e46d8 100644 --- a/main/environments/grid-world/index.html +++ b/main/environments/grid-world/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -473,7 +475,7 @@

    Grid-World + diff --git a/main/environments/minecart-deterministic/index.html b/main/environments/minecart-deterministic/index.html index 703257cd..4b865583 100644 --- a/main/environments/minecart-deterministic/index.html +++ b/main/environments/minecart-deterministic/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -532,7 +534,7 @@

    Credits¶ - + diff --git a/main/environments/minecart-rgb/index.html b/main/environments/minecart-rgb/index.html index 5cda0f46..31fc55a0 100644 --- a/main/environments/minecart-rgb/index.html +++ b/main/environments/minecart-rgb/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -522,7 +524,7 @@

    Credits¶ - + diff --git a/main/environments/minecart/index.html b/main/environments/minecart/index.html index e58929aa..96e16273 100644 --- a/main/environments/minecart/index.html +++ b/main/environments/minecart/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -520,7 +522,7 @@

    Credits¶ - + diff --git a/main/environments/misc/index.html b/main/environments/misc/index.html index 54dfeee6..06636781 100644 --- a/main/environments/misc/index.html +++ b/main/environments/misc/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -453,7 +455,7 @@

    Miscellaneous + diff --git a/main/environments/mo-ant-2d/index.html b/main/environments/mo-ant-2d/index.html index 6a9d3ba2..62116594 100644 --- a/main/environments/mo-ant-2d/index.html +++ b/main/environments/mo-ant-2d/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -464,7 +466,7 @@

    Reward Space + diff --git a/main/environments/mo-ant/index.html b/main/environments/mo-ant/index.html index 286e5dba..ad0566eb 100644 --- a/main/environments/mo-ant/index.html +++ b/main/environments/mo-ant/index.html @@ -8,7 +8,7 @@ - + @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -385,12 +387,12 @@

    Reward Space - +
    Next
    -
    MO-Humanoid
    +
    MO-Swimmer
    @@ -474,7 +476,7 @@

    Reward Space + diff --git a/main/environments/mo-halfcheetah/index.html b/main/environments/mo-halfcheetah/index.html index 8f499182..db2807c5 100644 --- a/main/environments/mo-halfcheetah/index.html +++ b/main/environments/mo-halfcheetah/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -473,7 +475,7 @@

    Reward Space + diff --git a/main/environments/mo-highway-fast/index.html b/main/environments/mo-highway-fast/index.html index e193c216..b1e48a02 100644 --- a/main/environments/mo-highway-fast/index.html +++ b/main/environments/mo-highway-fast/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -426,7 +428,7 @@

    MO-Highway-Fast + diff --git a/main/environments/mo-highway/index.html b/main/environments/mo-highway/index.html index 3e0aa320..19c60fda 100644 --- a/main/environments/mo-highway/index.html +++ b/main/environments/mo-highway/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -469,7 +471,7 @@

    Reward Space + diff --git a/main/environments/mo-hopper-2d/index.html b/main/environments/mo-hopper-2d/index.html index 923f4f72..3377ff96 100644 --- a/main/environments/mo-hopper-2d/index.html +++ b/main/environments/mo-hopper-2d/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -463,7 +465,7 @@

    Reward Space + diff --git a/main/environments/mo-hopper/index.html b/main/environments/mo-hopper/index.html index dcfc449b..1fb3f2d2 100644 --- a/main/environments/mo-hopper/index.html +++ b/main/environments/mo-hopper/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -473,7 +475,7 @@

    Reward Space + diff --git a/main/environments/mo-humanoid/index.html b/main/environments/mo-humanoid/index.html index daa8c2f0..a73342a4 100644 --- a/main/environments/mo-humanoid/index.html +++ b/main/environments/mo-humanoid/index.html @@ -8,7 +8,7 @@ - + @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -380,7 +382,7 @@

    Reward Space - + @@ -389,7 +391,7 @@

    Reward SpaceMO-Ant +
    MO-Swimmer
    @@ -470,7 +472,7 @@

    Reward Space + diff --git a/main/environments/mo-lunar-lander-continuous/index.html b/main/environments/mo-lunar-lander-continuous/index.html index 2a29011f..eb96dae6 100644 --- a/main/environments/mo-lunar-lander-continuous/index.html +++ b/main/environments/mo-lunar-lander-continuous/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -339,10 +341,10 @@

    MO-Lunar-Lander-Continuous

    Observation High

    -

    [1.5 1.5 5. 5. 3.14 5. 1. 1. ]

    +

    [ 2.5 2.5 10. 10. 6.28 10. 1. 1. ]

    Observation Low

    -

    [-1.5 -1.5 -5. -5. -3.14 -5. -0. -0. ]

    +

    [ -2.5 -2.5 -10. -10. -6.28 -10. -0. -0. ]

    Reward Shape

    (4,)

    @@ -354,7 +356,7 @@

    MO-Lunar-Lander-Continuous

    Import

    -

    mo_gymnasium.make("mo-lunar-lander-continuous-v2")

    +

    mo_gymnasium.make("mo-lunar-lander-continuous-v3")

    @@ -472,7 +474,7 @@

    Reward Space + diff --git a/main/environments/mo-lunar-lander/index.html b/main/environments/mo-lunar-lander/index.html index 99eef0c3..dd0b7dde 100644 --- a/main/environments/mo-lunar-lander/index.html +++ b/main/environments/mo-lunar-lander/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -339,10 +341,10 @@

    MO-Lunar-Lander

    Observation High

    -

    [1.5 1.5 5. 5. 3.14 5. 1. 1. ]

    +

    [ 2.5 2.5 10. 10. 6.28 10. 1. 1. ]

    Observation Low

    -

    [-1.5 -1.5 -5. -5. -3.14 -5. -0. -0. ]

    +

    [ -2.5 -2.5 -10. -10. -6.28 -10. -0. -0. ]

    Reward Shape

    (4,)

    @@ -354,7 +356,7 @@

    MO-Lunar-Lander

    Import

    -

    mo_gymnasium.make("mo-lunar-lander-v2")

    +

    mo_gymnasium.make("mo-lunar-lander-v3")

    @@ -470,7 +472,7 @@

    Reward Space + diff --git a/main/environments/mo-mountaincar-3d/index.html b/main/environments/mo-mountaincar-3d/index.html index d9226944..35045fa1 100644 --- a/main/environments/mo-mountaincar-3d/index.html +++ b/main/environments/mo-mountaincar-3d/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -461,7 +463,7 @@

    Reward space: + diff --git a/main/environments/mo-mountaincar-timemove/index.html b/main/environments/mo-mountaincar-timemove/index.html index 24366245..8e9b9c9d 100644 --- a/main/environments/mo-mountaincar-timemove/index.html +++ b/main/environments/mo-mountaincar-timemove/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -461,7 +463,7 @@

    Reward space: + diff --git a/main/environments/mo-mountaincar-timespeed/index.html b/main/environments/mo-mountaincar-timespeed/index.html index 503e55ae..cb088892 100644 --- a/main/environments/mo-mountaincar-timespeed/index.html +++ b/main/environments/mo-mountaincar-timespeed/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -461,7 +463,7 @@

    Reward space: + diff --git a/main/environments/mo-mountaincar/index.html b/main/environments/mo-mountaincar/index.html index 913beb91..21fefc46 100644 --- a/main/environments/mo-mountaincar/index.html +++ b/main/environments/mo-mountaincar/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -471,7 +473,7 @@

    Reward space: + diff --git a/main/environments/mo-mountaincarcontinuous/index.html b/main/environments/mo-mountaincarcontinuous/index.html index 15d2e4e0..0132d200 100644 --- a/main/environments/mo-mountaincarcontinuous/index.html +++ b/main/environments/mo-mountaincarcontinuous/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -464,7 +466,7 @@

    Reward space: + diff --git a/main/environments/mo-reacher/index.html b/main/environments/mo-reacher/index.html index 1df842fd..de4bd00e 100644 --- a/main/environments/mo-reacher/index.html +++ b/main/environments/mo-reacher/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -361,7 +363,7 @@

    MO-Reacher

    Description

    -

    Mujoco version of mo-reacher-v0, based on Reacher-v4 environment.

    +

    Multi-objective version of the Reacher-v4 environment.

    Observation Space

    @@ -481,7 +483,7 @@

    Reward Space + diff --git a/main/environments/mo-supermario/index.html b/main/environments/mo-supermario/index.html index aa8ccf8e..ea4a18a5 100644 --- a/main/environments/mo-supermario/index.html +++ b/main/environments/mo-supermario/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -476,7 +478,7 @@

    Episode Termination + diff --git a/main/environments/mo-swimmer/index.html b/main/environments/mo-swimmer/index.html index 1debafa9..48809779 100644 --- a/main/environments/mo-swimmer/index.html +++ b/main/environments/mo-swimmer/index.html @@ -11,7 +11,7 @@ - + MO-Swimmer - MO-Gymnasium Documentation @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -234,11 +235,14 @@
  • MO-Mountaincar
  • MO-Mountaincarcontinuous
  • MO-Lunar-Lander
  • +
  • MO-Lunar-Lander-Continuous
  • Miscellaneous @@ -317,9 +321,10 @@
    -

    MO-Swimmer#

    +

    MO-Swimmer

    -../../_images/mo-swimmer.gif +../../_images/mo-swimmer.gif +
    @@ -357,12 +362,15 @@

    MO-Swimmer -

    Description#

    +

    Description

    Multi-objective version of the SwimmerEnv environment.

    See Gymnasium’s env for more information.

    +

    The original Gymnasium’s ‘Swimmer-v4’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-swimmer-v4’) +LinearReward(env, weight=np.array([1.0, 1e-4]))

    -

    Reward Space#

    +

    Reward Space

    The reward is 2-dimensional:

    Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -470,7 +472,7 @@

    Reward Space + diff --git a/main/environments/mujoco/index.html b/main/environments/mujoco/index.html index 901be049..40c4e4a4 100644 --- a/main/environments/mujoco/index.html +++ b/main/environments/mujoco/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -468,7 +470,7 @@

    MuJoCo + diff --git a/main/environments/resource-gathering/index.html b/main/environments/resource-gathering/index.html index 19a800a7..11289649 100644 --- a/main/environments/resource-gathering/index.html +++ b/main/environments/resource-gathering/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -507,7 +509,7 @@

    Credits¶ - + diff --git a/main/environments/water-reservoir/index.html b/main/environments/water-reservoir/index.html index 07c6a93a..1168e99d 100644 --- a/main/environments/water-reservoir/index.html +++ b/main/environments/water-reservoir/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -511,7 +513,7 @@

    Credits¶ - + diff --git a/main/examples/citation/index.html b/main/examples/citation/index.html index 0202d6a4..89d6c0c3 100644 --- a/main/examples/citation/index.html +++ b/main/examples/citation/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -414,7 +416,7 @@

    Citation - + diff --git a/main/examples/morl_baselines/index.html b/main/examples/morl_baselines/index.html index 60726a16..f52abf03 100644 --- a/main/examples/morl_baselines/index.html +++ b/main/examples/morl_baselines/index.html @@ -8,7 +8,7 @@ - + @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -348,7 +350,7 @@

    MORL Baselines - + @@ -357,7 +359,7 @@

    MORL BaselinesWrappers +
    Vector Wrappers
    @@ -418,7 +420,7 @@

    MORL Baselines + diff --git a/main/examples/publications/index.html b/main/examples/publications/index.html index 87533006..04305791 100644 --- a/main/examples/publications/index.html +++ b/main/examples/publications/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -422,7 +424,7 @@

    List of Publications + diff --git a/main/genindex/index.html b/main/genindex/index.html index 415f4885..2a922f00 100644 --- a/main/genindex/index.html +++ b/main/genindex/index.html @@ -213,6 +213,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -250,6 +251,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -325,7 +327,7 @@

    Index

    L

    @@ -335,15 +337,21 @@

    L

    M

    @@ -414,7 +422,7 @@

    M

    - + diff --git a/main/index.html b/main/index.html index 131ca8e1..6b7864c4 100644 --- a/main/index.html +++ b/main/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -366,7 +368,7 @@

    API

    next_obs, vector_reward, terminated, truncated, info = env.step(your_agent.act(obs)) # Optionally, you can scalarize the reward function with the LinearReward wrapper -env = mo_gym.LinearReward(env, weight=np.array([0.8, 0.2, 0.2])) +env = mo_gym.wrappers.LinearReward(env, weight=np.array([0.8, 0.2, 0.2]))

    For details on multi-objective MDP’s (MOMDP’s) and other MORL definitions, see A practical guide to multi-objective reinforcement learning and planning.

    @@ -457,7 +459,7 @@

    Citing + diff --git a/main/introduction/api/index.html b/main/introduction/api/index.html index c9c5e053..91ab4264 100644 --- a/main/introduction/api/index.html +++ b/main/introduction/api/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -342,7 +344,7 @@

    API

    next_obs, vector_reward, terminated, truncated, info = env.step(your_agent.act(obs)) # Optionally, you can scalarize the reward function with the LinearReward wrapper -env = mo_gym.LinearReward(env, weight=np.array([0.8, 0.2, 0.2])) +env = mo_gym.wrappers.LinearReward(env, weight=np.array([0.8, 0.2, 0.2]))

    For details on multi-objective MDP’s (MOMDP’s) and other MORL definitions, see A practical guide to multi-objective reinforcement learning and planning.

    @@ -423,7 +425,7 @@

    API

    + diff --git a/main/introduction/install/index.html b/main/introduction/install/index.html index dc03303d..d09f6d3b 100644 --- a/main/introduction/install/index.html +++ b/main/introduction/install/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -410,7 +412,7 @@

    Install¶ - + diff --git a/main/objects.inv b/main/objects.inv index 60846383e1b69cab31d21f5e6a41d6df7ef86e51..3ba6d0782e0893d074bd6c05b4e7acc7a196291f 100644 GIT binary patch delta 1417 zcmV;41$O$F3-Jq(dVj5%U2~);6o&8p6;#dMGVXj_O>J#ezIV2gnN;`G1LzS z1(;6nuiqnzA_Cfzy-5(x`y4(LUhR@UZjWU}B&*B!2SN6GD&+fHR#75W^gu+8_Qx+- zL8L?0Dg?}i;}bWAFi$zLYE&`fc0BDfVjp2S}ttL&$~xT;?MC+aElf@7I}ac-7( zFEIMIbZU$Yb!F!9!rt4ZoPR)P^ZB2|Q}T@n3-Zl8w5O%^!xr=+_^6+j-^DD*e9|K@ z--GZ?|M~aNNPnvQOU|=~372W}2VrziwiJEi3SINM%9GXA+2!4p9oyEV=(L1rHT3(^*0VJanfk;DfT zBu-ZdT{cx~sQS@WCCip!d5(VJrn&G%+mtL^q!W_%>*~pR*R_q)J~6pFa2`%#0#bC{ zl^g)C1%DQtmtlg5NSmER;1v`dhNzipMiHLiAp|J83Wo9!%a96rGDrClFLCAORS1Q29lSKEyXld)b( z-6xsRq97IJwex6~9Fr;DyCH49Pd${j%Z1`7+}myeII0zybDm5 zq~a{j>S9_{cQGLqbwvb*`z((S(2mo@TU~LhE27k9g9h7B!+pFofhC#bYBu$*ZIZSG z|9_+igH1m=7As8S?}qCb5`W4UQX$d><4>1SwqhkMdF0>=#82}4=o)6T$vvg{De1Jp zn@_jI5-z(1yaG327G8chfMI)yE`1lGp{uq$!N?k(x{?USW27NU!`A)fly_id8ShpX z(vsTp1alz8GZpdu!^CLNLwn)gclAF!i+_wvH-o>Ld)%aYoTDy%e~Y7kBgR8Ty! zP=0{xl@_sVw=`f~FBC-CZpbS)zGn%caXx;?$lxqO^%f@#96ZcoV(VhO$fc9-_bCI? z_8~!taUz4v@f|^>RudKRzI-%8w;4GyooR{Rd(6Kz0;;;R@aIwkfmC&BgWojhov=a&-R{f3g)2^tCl@ z^c;ATZ3QJi$bYt?c*~Wls5JVDY-yzlw0UKMH#%SDv)ud*E8oHp3#M4J%e#N>045zd z`m^CkF;M=M6}+z7hN)9Nv?juNcaE-XGb<@QU`Yv9FeKRuni%yg*N%GDfeYRgltHDs+VF4=k-;d8JBz|A6q(Y_-#_z9_Y{hC?^Tfp$$)DBv)^{vclLt!6bIKV(u%78j z6@Og!5eN$Wf<=7$;R1%^CAsx|ih*vr_6#Fi_}0}#FrFffSqAnvJkEGWQvIMJ{l&LA zhV|4v_#c?|UtT1JWV%7${==`lK?o|r4-^#dh=Lh==6)eHM;jaaWMfnOk-)VHODm~( zgLb#@L&N;6nSY@CPVlXLYZTVtGM=|Y(h4qL8I(^`^n!2h z(4~DIQHOS0fj!pzFvv~F(H)ou#9z>Z6V0ZcE&QWlbZz}_1ka>JRHIGnWjoq1I3Ryc zMK+qF&-!0Bru5T67Z0By3ckN=3$v``z}y7CFP|$|BNeHtsH*SRV=#?u;{3uB9DlrD zKfQ$4O9MQ&=i{uOTYzXsXQiY6iikP~Hc7V^e@db6{ZZtbtfRB>r4m+-q?BR<%jnxtj3!eP7cLe)fvk9nt*#F?#A-+5hrtKIHInstall
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -393,7 +395,7 @@

    MO-Gymnasium 1.0.0 Release Notes

    reward = forward_reward - ctrl_cost

    With MORL, users have the flexibility to determine the compromises they desire based on their preferences for each objective. Consequently, the environments in MO-Gymnasium do not have predefined weights. Thus, MO-Gymnasium extends the capabilities of Gymnasium to the multi-objective setting, where the agents receives a vectorial reward.

    For example, here is an illustration of the multiple policies learned by an MORL agent for the mo-halfcheetah domain, balancing between saving battery and speed:

    - +

    This release marks the first mature version of MO-Gymnasium within Farama, indicating that the API is stable, and we have achieved a high level of quality in this library.

    API

    + diff --git a/main/search/index.html b/main/search/index.html index d8f97aef..df585802 100644 --- a/main/search/index.html +++ b/main/search/index.html @@ -212,6 +212,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -249,6 +250,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -391,7 +393,7 @@ - + diff --git a/main/searchindex.js b/main/searchindex.js index b5f5fcce..d0037418 100644 --- a/main/searchindex.js +++ b/main/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"0.1.1": [[44, "release-0-1-1"]], "0.1.2": [[44, "release-0-1-2"]], "0.2.0": [[44, "release-0-2-0"]], "0.2.1": [[44, "release-0-2-1"]], "1. Create a new environment class": [[45, "create-a-new-environment-class"]], "2. Register the environment": [[45, "register-the-environment"]], "3. Test the environment": [[45, "test-the-environment"]], "4. Instantiate your environment": [[45, "instantiate-your-environment"]], "404 - Page Not Found": [[0, null]], "API": [[41, null], [42, null]], "Acknowledgements": [[3, "acknowledgements"]], "Action Space": [[4, "action-space"], [6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [13, "action-space"], [14, "action-space"], [15, "action-space"], [32, "action-space"], [36, "action-space"], [37, "action-space"]], "Arguments": [[4, "arguments"], [6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [13, "arguments"], [14, "arguments"], [15, "arguments"], [37, "arguments"]], "Breakable-Bottles": [[4, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Citation": [[38, null]], "Citing": [[41, "citing"]], "Classic Control": [[5, null]], "Community": [[3, null]], "Creating a custom environment": [[45, null]], "Credits": [[4, "credits"], [6, "credits"], [7, "credits"], [8, "credits"], [9, "credits"], [10, "credits"], [13, "credits"], [14, "credits"], [15, "credits"], [36, "credits"], [37, "credits"]], "Deep-Sea-Treasure": [[6, null]], "Deep-Sea-Treasure-Concave": [[7, null]], "Deep-Sea-Treasure-Mirrored": [[8, null]], "Description": [[4, "description"], [6, "description"], [7, "description"], [8, "description"], [9, "description"], [10, "description"], [11, "description"], [13, "description"], [14, 
"description"], [15, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [32, "description"], [33, "description"], [34, "description"], [36, "description"], [37, "description"]], "Episode Termination": [[4, "episode-termination"], [6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [11, "episode-termination"], [13, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [33, "episode-termination"], [36, "episode-termination"]], "Fishwood": [[9, null]], "Four-Room": [[10, null]], "Fruit-Tree": [[11, null]], "Grid-World": [[12, null]], "Install": [[41, "install"], [43, null]], "LinearReward": [[46, "linearreward"]], "List of Publications": [[40, null]], "MO-Ant": [[17, null]], "MO-Ant-2D": [[18, null]], "MO-Gymnasium 0.3.0 Release: Migrate to Gymnasium": [[44, "release-0-3-0"]], "MO-Gymnasium 0.3.1 Release: Improved documentation and MuJoco MO-Reacher environment": [[44, "release-0-3-1"]], "MO-Gymnasium 0.3.2 Release: Bug fixes, improved webpage": [[44, "release-0-3-2"]], "MO-Gymnasium documentation": [[1, null]], "MO-Halfcheetah": [[19, null]], "MO-Highway": [[20, null]], "MO-Highway-Fast": [[21, null]], "MO-Hopper": [[22, null]], "MO-Hopper-2D": [[23, null]], "MO-Humanoid": [[24, null]], "MO-Lunar-Lander": [[25, null]], "MO-Lunar-Lander-Continuous": [[26, null]], "MO-Mountaincar": [[27, null]], "MO-Mountaincar-3D": [[28, null]], "MO-Mountaincar-Timemove": [[29, null]], "MO-Mountaincar-Timespeed": [[30, null]], "MO-Mountaincarcontinuous": [[31, null]], "MO-Reacher": [[32, null]], "MO-Supermario": [[33, null]], "MO-Walker2D": [[34, null]], "MOClipReward": [[46, "moclipreward"]], "MONormalizeReward": [[46, "monormalizereward"]], "MORL Baselines": [[39, null]], "MORecordEpisodeStatistics": [[46, "morecordepisodestatistics"]], 
"MOSyncVectorEnv": [[46, "mosyncvectorenv"]], "Minecart": [[13, null]], "Minecart-Deterministic": [[14, null]], "Minecart-Rgb": [[15, null]], "Miscellaneous": [[16, null]], "MuJoCo": [[35, null]], "Observation Space": [[4, "observation-space"], [6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [13, "observation-space"], [14, "observation-space"], [15, "observation-space"], [32, "observation-space"], [36, "observation-space"], [37, "observation-space"]], "References": [[10, "references"]], "Release Notes": [[44, null]], "Resource-Gathering": [[36, null]], "Reward Space": [[4, "reward-space"], [6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [9, "reward-space"], [10, "reward-space"], [11, "reward-space"], [13, "reward-space"], [14, "reward-space"], [15, "reward-space"], [17, "reward-space"], [18, "reward-space"], [19, "reward-space"], [20, "reward-space"], [22, "reward-space"], [23, "reward-space"], [24, "reward-space"], [25, "reward-space"], [26, "reward-space"], [32, "reward-space"], [33, "reward-space"], [34, "reward-space"], [36, "reward-space"], [37, "reward-space"]], "Reward space:": [[27, "reward-space"], [28, "reward-space"], [29, "reward-space"], [30, "reward-space"], [31, "reward-space"]], "Starting State": [[4, "starting-state"], [6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [13, "starting-state"], [14, "starting-state"], [15, "starting-state"], [36, "starting-state"], [37, "starting-state"]], "Termination": [[9, "termination"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Water-Reservoir": [[37, null]], "Wrappers": [[46, null]], "v0.3.3: MO-Gymnasium 0.3.3 Release: Policy Evaluation bug fix, better documentation page": [[44, "release-v0-3-3"]], "v0.3.4: MO-Gymnasium 0.3.4 Release: Known Pareto 
Front, improved renders and documentation": [[44, "release-v0-3-4"]], "v1.0.0: MO-Gymnasium becomes mature": [[44, "release-v1-0-0"]], "v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more": [[44, "release-v1-0-1"]], "v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more": [[44, "release-v1-1-0"]]}, "docnames": ["404", "README", "citing/citing", "community/community", "environments/breakable-bottles", "environments/classical", "environments/deep-sea-treasure", "environments/deep-sea-treasure-concave", "environments/deep-sea-treasure-mirrored", "environments/fishwood", "environments/four-room", "environments/fruit-tree", "environments/grid-world", "environments/minecart", "environments/minecart-deterministic", "environments/minecart-rgb", "environments/misc", "environments/mo-ant", "environments/mo-ant-2d", "environments/mo-halfcheetah", "environments/mo-highway", "environments/mo-highway-fast", "environments/mo-hopper", "environments/mo-hopper-2d", "environments/mo-humanoid", "environments/mo-lunar-lander", "environments/mo-lunar-lander-continuous", "environments/mo-mountaincar", "environments/mo-mountaincar-3d", "environments/mo-mountaincar-timemove", "environments/mo-mountaincar-timespeed", "environments/mo-mountaincarcontinuous", "environments/mo-reacher", "environments/mo-supermario", "environments/mo-walker2d", "environments/mujoco", "environments/resource-gathering", "environments/water-reservoir", "examples/citation", "examples/morl_baselines", "examples/publications", "index", "introduction/api", "introduction/install", "release_notes", "tutorials/custom_env", "wrappers/wrappers"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, 
"sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["404.md", "README.md", "citing/citing.md", "community/community.md", "environments/breakable-bottles.md", "environments/classical.md", "environments/deep-sea-treasure.md", "environments/deep-sea-treasure-concave.md", "environments/deep-sea-treasure-mirrored.md", "environments/fishwood.md", "environments/four-room.md", "environments/fruit-tree.md", "environments/grid-world.md", "environments/minecart.md", "environments/minecart-deterministic.md", "environments/minecart-rgb.md", "environments/misc.md", "environments/mo-ant.md", "environments/mo-ant-2d.md", "environments/mo-halfcheetah.md", "environments/mo-highway.md", "environments/mo-highway-fast.md", "environments/mo-hopper.md", "environments/mo-hopper-2d.md", "environments/mo-humanoid.md", "environments/mo-lunar-lander.md", "environments/mo-lunar-lander-continuous.md", "environments/mo-mountaincar.md", "environments/mo-mountaincar-3d.md", "environments/mo-mountaincar-timemove.md", "environments/mo-mountaincar-timespeed.md", "environments/mo-mountaincarcontinuous.md", "environments/mo-reacher.md", "environments/mo-supermario.md", "environments/mo-walker2d.md", "environments/mujoco.md", "environments/resource-gathering.md", "environments/water-reservoir.md", "examples/citation.md", "examples/morl_baselines.md", "examples/publications.md", "index.md", "introduction/api.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "wrappers/wrappers.md"], "indexentries": {"linearreward (class in mo_gymnasium)": [[46, "mo_gymnasium.LinearReward", false]], "moclipreward (class in mo_gymnasium)": [[46, "mo_gymnasium.MOClipReward", false]], "monormalizereward (class in mo_gymnasium)": [[46, "mo_gymnasium.MONormalizeReward", false]], "morecordepisodestatistics (class in mo_gymnasium)": [[46, "mo_gymnasium.MORecordEpisodeStatistics", false]], "mosyncvectorenv (class in mo_gymnasium)": [[46, "mo_gymnasium.MOSyncVectorEnv", false]]}, "objects": 
{"mo_gymnasium": [[46, 0, 1, "", "LinearReward"], [46, 0, 1, "", "MOClipReward"], [46, 0, 1, "", "MONormalizeReward"], [46, 0, 1, "", "MORecordEpisodeStatistics"], [46, 0, 1, "", "MOSyncVectorEnv"]]}, "objnames": {"0": ["py", "class", "Python class"]}, "objtypes": {"0": "py:class"}, "terms": {"": [4, 5, 6, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 41, 42, 46], "0": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 41, 42, 46], "01": 44, "02": 44, "03": 44, "06": 44, "07": [27, 28, 29, 30, 31], "08": [44, 46], "09": 44, "1": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 46], "10": [6, 7, 8, 11, 12, 36, 37], "100": [25, 26, 33, 46], "11": [6, 7, 22, 23, 44], "1109": 37, "1145": 36, "12": 44, "124": [7, 8], "13": [10, 44], "1390156": 36, "1390162": 36, "14": [10, 25, 26, 44], "16": 44, "160": 37, "17": [19, 24, 34], "18": 44, "19": 44, "1e": 46, "2": [4, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 41, 42], "20": [8, 44], "200": 9, "2008": [12, 36], "2010": 12, "2011": 5, "2012": 37, "2013": 16, "2017": 10, "2018": 12, "2019": [6, 7, 8, 11, 12, 13, 14, 15, 16], "2020": 35, "2021": 12, "2022": [2, 5, 12, 40, 44], "2022bnaic": 2, "2023": [38, 40, 41, 44], "2024": [40, 44], "21": 44, "23": [6, 44], "24": 44, "240": [4, 33], "25": [33, 44], "255": [15, 33], "256": 33, "25th": 36, "26": 44, "27": [17, 18, 44], "2d": [6, 7, 8, 10, 13, 14, 15, 31, 44, 46], "3": [4, 6, 7, 8, 10, 13, 14, 15, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32, 33, 36, 37], "30": 44, "31": 44, "33": 44, "34": 44, "34th": 2, "35": 44, "360": 4, "37": 44, "376": 24, "37th": [38, 41], "3d": [5, 13, 14, 15, 27, 29, 30], "4": [4, 6, 7, 8, 10, 13, 14, 15, 24, 25, 26, 32, 33, 36, 37], "40": 44, "41": [36, 44], "42": 44, "43": 44, "45": 44, "46": 44, "47": [36, 44], "480": 15, 
"5": [4, 11, 12, 13, 14, 15, 20, 21, 25, 26, 33, 36, 44], "50": [4, 44], "51": 44, "52": 44, "53": 44, "55": 44, "56": 44, "57": 44, "58": 44, "59": 44, "6": [11, 12, 13, 14, 15, 19, 27, 28, 29, 30, 31, 32, 34], "60": 44, "61": 44, "62": 44, "6252759": 37, "63": 11, "64": 44, "65": 44, "67": 44, "69": 44, "7": [6, 11, 12, 13, 14, 15, 44], "70": 44, "72": 44, "73": 44, "74": 44, "75": 44, "76": 44, "77": 44, "79": 44, "8": [17, 18, 25, 26, 37, 41, 42, 44], "80": 44, "81": 44, "83": 44, "84": 44, "86": 44, "87": 44, "9": 32, "99": 46, "A": [2, 4, 10, 16, 17, 18, 21, 27, 28, 29, 30, 31, 37, 38, 40, 41, 42, 46], "As": [4, 41, 42], "By": [27, 28, 29, 30, 37], "For": [1, 32, 41, 42, 44, 46], "If": [3, 13, 14, 15, 17, 18, 22, 23, 37, 38, 41, 45], "In": [4, 44], "It": [39, 41, 42, 44, 45], "Of": 44, "The": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 31, 32, 33, 34, 36, 37, 41, 44, 45], "There": 37, "To": [1, 6, 7, 8, 41, 43], "With": 44, "__init__": 45, "_build": 1, "_episod": 46, "_final_info": 46, "_final_observ": 46, "_forward_reward_weight": 44, "aama": 40, "abel": [13, 14, 15, 16], "about": [1, 5], "abov": 4, "acceler": [13, 14, 15], "accept": 44, "access": 44, "account": [4, 12], "achiev": 44, "act": [41, 42, 44], "action": [5, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 44, 45], "action_spac": 45, "ad": [17, 18, 22, 23, 45], "adapt": [6, 7, 8, 10], "add": [27, 28, 29, 30, 40, 44], "add_speed_object": [27, 28, 29, 30], "addit": 5, "addition": 44, "after": [9, 44, 46], "again": 4, "agent": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 36, 37, 44], "ai": 4, "al": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 35, 40], "alegr": [2, 12, 38, 40, 41], "algorithm": [39, 41], "align": 40, "all": [3, 17, 18, 36, 41, 43, 44, 46], "allow": 44, "also": [3, 16, 41, 42, 44], "altern": [27, 28, 29, 30], "alwai": [6, 7, 8], "amount": [16, 37], "an": [5, 10, 27, 28, 29, 30, 33, 36, 37, 41, 42, 44, 45, 46], 
"ana": [2, 38, 41], "andrea": 44, "andr\u00e9": 10, "angl": 32, "angular": 32, "ann": [2, 38, 41], "ansi": 37, "ansimuz": [6, 7, 8], "ant": 35, "antenv": [17, 18], "api": [39, 44, 45], "appear": 2, "appli": [4, 32, 46], "approach": 4, "approxim": 40, "ar": [3, 4, 13, 14, 15, 16, 36, 37, 44, 45, 46], "arm": 32, "arrai": [10, 17, 18, 19, 22, 23, 41, 42, 44, 45, 46], "art": [4, 6, 7, 8, 44], "artifici": 2, "asid": 3, "ask": 3, "asset": [4, 36, 44], "assist": [4, 6, 7, 8], "attribut": 45, "australia": 37, "author": [2, 38, 41], "autobuild": 1, "automat": [1, 44, 45], "avail": [44, 46], "avoid": [10, 16], "axel": [13, 14, 15], "axelabel": 3, "axi": [22, 23], "b": 1, "back": 44, "background": [6, 7, 8, 37], "backward": 5, "balanc": 44, "barret": 12, "barreto": 10, "barrett": 36, "base": [3, 4, 13, 14, 15, 32, 35, 37, 40, 44], "baselin": 44, "batteri": 44, "bazzan": [2, 38, 41], "becaus": 4, "been": [4, 5, 44], "befor": 46, "begin": 46, "behind": 5, "benchmark": [38, 40, 41], "benefit": 44, "benelearn": 2, "benelux": 2, "between": [33, 37, 41, 44, 46], "bib": 44, "binari": [10, 11, 12], "blob": [13, 14, 15], "blue": 10, "bnaic": [2, 40], "bnj6kubtg6": 41, "booktitl": [2, 38, 41], "bool": 46, "boolean": [4, 46], "bottl": 12, "bottle_reward": 4, "bottles_carri": 4, "bottles_deliv": [4, 12], "bottles_drop": 4, "bound": [37, 44], "box": [6, 7, 8, 17, 18, 19, 22, 23, 24, 26, 31, 34, 37], "brake": [13, 14, 15], "break": 44, "breakabl": 12, "breakablebottl": 4, "brisban": 37, "bro": 33, "bruno": [2, 38, 41], "budget": 40, "bugfix": 44, "bump": 44, "button": 44, "c": [2, 38, 41], "cai": 40, "calcul": 4, "call": 44, "callabl": 46, "can": [3, 4, 9, 11, 13, 14, 15, 27, 28, 29, 30, 37, 41, 42, 43, 44], "cannot": 4, "capabl": 44, "capac": [13, 14, 15], "car": [5, 27, 28, 29, 30, 44], "carb": [11, 12], "care": 46, "carri": 4, "cart": [13, 14, 15], "castelletti": 37, "catch": 9, "caus": 44, "cc": 44, "cd": 1, "cell": 12, "central": 32, "certain": [41, 43], "chanc": 12, "chang": [1, 6, 
7, 8, 27, 28, 29, 30, 44], "changelog": 44, "check": [41, 42], "chose": 11, "ci": 44, "circl": 10, "citat": 44, "cite": 38, "class": [5, 41, 42, 46], "classic": [6, 7, 8, 45], "clip": 46, "close": 45, "co": [13, 14, 15, 32], "code": [3, 6, 7, 8, 9, 10, 13, 14, 15, 37, 44], "coin": [16, 33], "colab": [41, 42], "collect": [9, 10, 11, 12, 13, 14, 15, 16, 33, 36, 44], "collis": [16, 20], "com": [3, 13, 14, 15], "combin": 44, "commit": 44, "commun": [41, 44], "compar": 41, "complet": 46, "compliant": 41, "compon": [10, 44, 46], "compromis": 44, "comput": [32, 44, 45], "concav": [12, 44], "concave_map": [6, 7, 8], "conduct": 44, "confer": [2, 36, 37, 38, 41], "config": [13, 14, 15], "configur": [13, 14, 15], "conflict": 44, "conor": 3, "consequ": 44, "consist": 36, "constructor": 45, "consum": [13, 14, 15], "consumpt": [5, 13, 14, 15, 16], "contain": [1, 4, 10, 11, 12, 13, 14, 15, 27, 28, 29, 30, 31, 32, 39], "content": 37, "context": 44, "continu": [5, 6, 7, 8, 16, 31, 35, 37, 44], "contrari": 46, "contribut": [1, 3, 4, 44], "contributor": [3, 44], "control": [6, 7, 8, 9, 17, 18, 19, 22, 23, 24, 34], "control_cost": 44, "converg": 5, "convers": 44, "convex": [6, 7, 8], "coordin": [6, 7, 8, 36, 41], "copi": 46, "corner": [13, 14, 15], "correspond": [16, 27, 28, 29, 30, 37], "cost": [17, 18, 19, 22, 23, 24, 25, 26, 34, 37], "cost_flood": 16, "cost_object": [17, 18, 22, 23], "crash": [25, 26], "creat": [4, 6, 7, 8, 41, 42, 44], "creation": 44, "criteria": 36, "ctrl_cost": 44, "cumul": 46, "current": [4, 6, 7, 8, 37], "custom": 44, "d": [11, 12, 40], "da": [2, 38, 41], "dall": [4, 6, 7, 8], "dam": [16, 37], "danoi": [2, 38, 41], "deal": 45, "death": 16, "decis": 37, "decomposit": 40, "deep": [3, 12], "deep_sea_treasur": 44, "deepseatreasur": [6, 7, 8], "default": [6, 7, 8, 13, 14, 15, 27, 28, 29, 30, 37], "deficit": 37, "deficit_wat": 16, "defin": [4, 5, 16, 32, 45], "definit": [41, 42], "deliv": [4, 12], "demand": 37, "deni": [3, 9], "dens": [13, 14, 15], "depend": [41, 
43], "deprec": 44, "depth": [11, 12], "deque_s": 46, "descript": [5, 12, 16, 35], "design": 44, "desir": 44, "destin": 12, "detail": [5, 41, 42], "determin": 44, "determinist": 44, "develop": 41, "di": 33, "diamond": 36, "dict": 4, "dictionari": [4, 12], "did": 4, "differ": [4, 12], "dim_reward": 46, "dimens": [4, 44], "dimension": [6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 32, 33, 34, 36], "directli": [44, 46], "directori": 45, "dirhtml": 1, "discord": [3, 41], "discount": [45, 46], "discret": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 21, 25, 27, 28, 29, 30, 32, 33, 35, 36, 44], "dissert": 5, "distanc": [32, 45], "distinct": 44, "distribut": 40, "do": 44, "doc": [1, 44], "document": [41, 45], "doe": [41, 43, 46], "doi": 37, "domain": 44, "done": 45, "dot": 46, "down": [6, 7, 8, 10, 36], "downstream": 37, "dr": 46, "drop": [4, 44], "dst": [12, 44], "dst_map": [6, 7, 8], "dtype": 44, "due": [5, 37], "dynmorl": 3, "e": [1, 2, 4, 6, 7, 8, 12, 31, 38, 41, 44], "each": [4, 6, 7, 8, 11, 13, 14, 15, 27, 28, 29, 30, 31, 32, 44], "eat": 12, "edit": 44, "effici": 40, "either": 9, "el": [2, 38, 41], "elaps": 46, "elbow": 32, "element": [36, 44], "els": [10, 33, 36], "enabl": 44, "end": [9, 13, 14, 15], "enemi": [4, 12, 16, 33, 36], "energi": 35, "engin": [25, 26], "entri": 40, "entry_point": 45, "env": [3, 5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 41, 42, 44, 45, 46], "env_fn": 46, "environ": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 40, 41, 42, 43, 46], "episod": [9, 37, 46], "epsilon": 46, "equival": 5, "esr": [12, 44], "essenti": [41, 45], "et": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 35, 40], "eval_mo": 44, "everi": [1, 11, 12], "exampl": [10, 39, 41, 42, 44], "excess": 37, "execut": [16, 37], "exhaust": 44, "expand": 44, "expect": 9, "extend": 44, "extra": [5, 27, 28, 29, 30], "ezpickl": 44, "f": [3, 37], "fair": 
40, "fall": 44, "fals": [17, 18, 22, 23], "famili": [41, 43], "fan": 40, "fantasi": [6, 7, 8], "far": 33, "farama": [3, 13, 14, 15, 41, 44], "fast": [16, 44], "fat": [11, 12], "featur": [3, 10, 44], "feder": 40, "felten": [2, 12, 38, 40, 41], "felten_toolkit_2023": [38, 41], "few": [44, 46], "ffelten": 44, "file": [13, 14, 15, 44, 45], "fill": [13, 14, 15], "final_info": 46, "final_observ": 46, "finger_tip_coord": 32, "fire": 12, "first": [2, 13, 14, 15, 37, 40, 44, 46], "fish": [9, 12], "fish_amount": 12, "fisherman": 9, "fishproba": 9, "fishwood": [3, 12, 44], "fit": 37, "fix": 10, "flag": [4, 17, 18, 22, 23, 33, 36, 45], "flexibl": 44, "float": [37, 45, 46], "float32": [17, 18, 19, 22, 23, 24, 26, 31, 34, 37], "float_stat": [6, 7, 8], "flood": 37, "florian": [2, 38, 41], "folder": 1, "follow": [2, 10, 13, 14, 15, 17, 18, 19, 22, 23, 27, 28, 29, 30, 41, 42, 44, 45], "fork": 1, "form": 46, "formerli": [2, 40], "forward": [5, 19, 22, 23, 24, 27, 28, 29, 30, 34], "forward_penalti": 5, "forward_reward": 44, "foundat": [13, 14, 15, 44], "four": [3, 12, 32], "frame_skip": [13, 14, 15], "framework": 40, "from": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 36, 37, 44, 45, 46], "front": 45, "fruit": [3, 12], "fruit_tre": 44, "fuel": [5, 13, 14, 15, 16, 25, 26, 31], "fuel_consumption_penalti": 5, "full": [11, 12, 44], "function": [41, 42, 44], "g": [10, 12, 44], "gamma": [45, 46], "gather": [12, 44], "gem": [4, 12, 36], "gener": [40, 44, 45], "get": 44, "gg": 41, "ghazali": [2, 38, 41], "gif": 44, "gimelfarb": [3, 10], "github": [3, 13, 14, 15, 44], "give": 5, "go": [1, 9, 11, 22, 23, 27, 28, 29, 30], "goal": [10, 12, 27, 28, 29, 30, 31], "goe": 45, "goir": [2, 38, 41], "gold": [4, 12, 36], "gr": [2, 38, 41], "green": 10, "grid": [6, 7, 8], "gridworld": [10, 12], "ground": 4, "group": 44, "gt": 44, "guarante": 40, "guid": [41, 42], "gupta": 5, "gym": [2, 33, 40, 41, 42, 44], "gymnasium": [2, 5, 13, 14, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 39, 
40, 41, 42, 43, 45, 46], "ha": [4, 5, 33, 44], "halfcheetah": [35, 44], "halfcheetahenv": 19, "harder": 12, "hartmann": 40, "have": [3, 4, 5, 12, 41, 44], "hay": 3, "healthi": [17, 18], "height": 35, "help": 3, "here": [3, 10, 41, 42, 44], "high": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 44], "higher": 44, "highwai": [16, 44], "highwayenv": 20, "highwayfastenv": 21, "home": [4, 36], "hopper": [35, 44], "hopperenv": [22, 23], "hotfix": 44, "how": [1, 13, 14, 15, 33, 39], "http": [3, 4, 6, 7, 8, 13, 14, 15, 36, 37, 41], "human": [13, 14, 15, 37], "humanoid": 35, "humanoidenv": 24, "humonoid": 35, "hung": 5, "hydroelectr": 37, "hyperparamet": 40, "i": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 39, 41, 42, 44, 45, 46], "ianleongudri": 44, "id": 45, "idx": 46, "igd": 45, "ijcnn": 37, "illustr": 44, "imag": [13, 14, 15, 16, 37], "image_observ": [13, 14, 15], "impact": 4, "implement": [4, 39, 45], "import": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 41, 42, 44, 45], "improv": 40, "includ": [16, 41, 43], "increment": [13, 14, 15], "incremental_frame_skip": [13, 14, 15], "index": 46, "indic": [4, 10, 36, 44], "inf": [4, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 32, 33, 34, 37], "info": [41, 42, 44, 45, 46], "info_dict": 44, "inform": [1, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 38, 41], "inher": 44, "inherit": 45, "init": 44, "initi": [37, 45], "initial_st": 37, "inproceed": [2, 38, 41], "inspir": 46, "instal": 1, "instanc": [41, 42, 44], "instead": [4, 44], "int": 46, "integ": 45, "integr": 44, "intellig": 2, "interact": [41, 42], "intern": [36, 37], "introduc": [5, 10, 44], "invert": 45, "io": [4, 6, 7, 8, 36], "itch": [4, 6, 7, 8, 36], "item": [10, 12], "item1": 12, "item2": 12, "item3": 12, "iter": [37, 
46], "its": 45, "ivanov": 40, "join": [3, 41], "joint": [32, 37], "json": [13, 14, 15], "jump": [22, 23], "kallinteri": 44, "keep": 46, "kei": 4, "kill": [12, 33, 36], "klassert": 4, "known": 45, "kwarg": 45, "l": [2, 38, 41, 46], "lack": 5, "land": [5, 25, 26], "lander": [5, 44], "lane": [16, 20], "larger": 4, "leaf": [11, 12], "learn": [2, 4, 9, 10, 36, 38, 40, 41, 42, 44], "left": [4, 6, 7, 8, 10, 11, 13, 14, 15, 36], "length": 46, "leon": 36, "level": [37, 44], "leverag": 40, "librari": [2, 40, 41, 44], "life": 44, "light": 12, "like": [3, 41, 43, 46], "limezu": [4, 36], "limit": 16, "line": 45, "linear": [17, 18, 19, 22, 23], "linearli": 44, "linearreward": [17, 18, 19, 22, 23, 41, 42, 44], "linearwrapp": 44, "link": 44, "lint": 44, "list": [4, 44], "literatur": 44, "local": 5, "locat": [4, 12, 32], "logo": 44, "look": 46, "low": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37], "lower": 10, "luca": [2, 38, 41], "lucasalegr": 44, "lunar": [5, 44], "lunarland": [5, 25, 26], "m": 37, "machin": 36, "made": [1, 44], "mai": 44, "main": [3, 13, 14, 15, 25, 26], "main_engine_fuel": 5, "make": [1, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 41, 42, 44, 45, 46], "mani": [13, 14, 15], "map": [6, 7, 8, 10, 12, 13, 14, 15], "mario": [33, 44], "mark": 44, "markov": 37, "mathieu": [3, 37], "max": 46, "max_r": 46, "max_t": 9, "maxima": 5, "maximum": 37, "maze": 10, "md": [1, 44], "mdp": [41, 42, 44], "merg": [5, 27, 28, 29, 30], "merge_move_penalti": [27, 28, 29, 30], "method": [44, 45], "metric": 45, "mgoulao": 44, "mike": [3, 10], "min": 46, "min_r": 46, "mine": [13, 14, 15], "mine_config": [13, 14, 15], "minecart": [3, 16, 41, 42, 44], "miner": [11, 12], "minerium": [13, 14, 15], "minim": [13, 14, 15, 16], "minor": 44, "mirror": 12, "mirrored_map": [6, 7, 8], "miss": [40, 44], "mistak": 44, "mo": [2, 3, 5, 13, 14, 15, 16, 35, 39, 40, 
41, 42, 43, 45, 46], "mo_gym": [17, 18, 19, 22, 23, 41, 42, 44], "mo_gymnasium": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 41, 42, 44, 45, 46], "mode": [13, 14, 15, 37], "model": [40, 41, 42], "modem": 40, "modifi": 44, "modul": 46, "mofl": 40, "momaxandskipobserv": 44, "momdp": [41, 42, 44], "monormalizereward": 44, "more": [1, 5, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 41, 42], "morecordepisodestatist": 44, "moreov": 45, "morewordstatist": 46, "morl": [3, 6, 7, 8, 9, 41, 42, 44], "mountain": [5, 27, 28, 29, 30, 31, 44], "mountaincar": [5, 31], "mountaincarcontinu": [5, 44], "move": [4, 5, 33, 36, 44], "move_penalti": 5, "much": 33, "mujoco": [32, 41, 43], "multi": [2, 5, 9, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 33, 34, 35, 37, 38, 40, 41, 42, 44, 45], "multibinari": 4, "multiobject": 4, "multipl": [4, 36, 39, 40, 44, 45, 46], "must": [12, 13, 14, 15, 16, 45], "my_env_dir": 45, "my_env_fil": 45, "my_env_v0": 45, "myenv": 45, "n": [2, 38, 41], "nO": 37, "narayanan": [12, 36], "ndarrai": 46, "need": 44, "neg": [10, 31, 32], "neighbour": 16, "network": 37, "neural": [37, 38, 41], "neurip": [38, 40, 41], "next": 45, "next_ob": [41, 42, 44], "ninjikin": [4, 36], "nip": 10, "node": 11, "none": [13, 14, 15, 37, 44, 46], "norm": 31, "normal": [37, 44, 46], "normalized_act": 37, "note": 4, "notebook": [41, 42], "now": [2, 38, 41, 44], "np": [17, 18, 19, 22, 23, 41, 42, 44], "num": 46, "num_env": 46, "number": [4, 37], "numpi": [41, 42, 44, 45, 46], "nutri1": 12, "nutri6": 12, "nutrient": [11, 12], "ob": [5, 12, 16, 35, 41, 42, 44], "object": [2, 5, 9, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 33, 34, 35, 37, 38, 40, 41, 42, 44, 45], "observ": [12, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 44, 45], "observation_spac": 45, "observationspac": 44, "off": 44, "oject": 45, "onc": 1, "one": [41, 43], 
"onli": 37, "open": [40, 41], "opengameart": 37, "optim": [36, 40, 44], "option": [27, 28, 29, 30, 41, 42, 44, 45], "order": 44, "ore1": 16, "ore2": 16, "ores": [13, 14, 15, 16], "org": [37, 41], "orient": [13, 14, 15], "origin": [4, 17, 18, 19, 22, 23, 41, 42, 44], "other": [16, 17, 18, 22, 23, 41, 42, 44, 46], "otherwis": [4, 9, 33], "our": [1, 44, 45], "out": [3, 37], "outcom": 4, "output": 46, "packag": [1, 44], "paper": 4, "pareto": [40, 45], "pareto_front": [44, 45], "parisi": 37, "part": [44, 45], "pass": [33, 44], "passag": 10, "path": [13, 14, 15], "paulina": 37, "penal": 37, "penalti": [4, 5, 6, 7, 8, 12, 27, 28, 29, 30, 31, 33], "peopl": 3, "percentag": 37, "perform": 45, "person": 40, "pf": 44, "pianosi": [16, 37], "pick": 4, "pip": [1, 41, 43], "pixel": [4, 6, 7, 8, 44], "plan": [41, 42], "pleas": [38, 40, 41], "plu": 10, "point": 33, "polici": [36, 40], "porcentag": [13, 14, 15], "port": 37, "posit": [5, 6, 7, 8, 10, 13, 14, 15, 32, 33, 36], "possibl": [4, 32], "potenti": [4, 12, 44], "pp": 37, "practic": [41, 42], "pranav": 5, "pre": 44, "predefin": 44, "prefer": 44, "prevent": 5, "previous": 44, "priorit": 40, "prob_drop": 4, "probabl": [4, 9], "problem": [4, 6, 7, 8, 9, 37, 44], "problemat": [41, 43], "proceed": [2, 36, 38, 41], "process": [38, 41], "product": 46, "project": 3, "protein": [11, 12], "provid": [3, 9, 41, 44], "public": [2, 41], "publish": 40, "pull": [40, 45], "py": 45, "pydoc": 44, "pypi": 44, "pytest": 45, "python": [41, 42, 44], "q": 37, "qld": 37, "qualiti": 44, "quantiti": [13, 14, 15], "question": 3, "r": [1, 46], "r_i": 32, "randint": 44, "random": 37, "rang": 44, "rather": 4, "reach": [3, 6, 7, 8, 10, 11, 12, 16, 27, 28, 29, 30, 31, 33, 44], "reacher": 35, "read": 5, "readm": 44, "reason": 5, "rebuild": 1, "receiv": [11, 44], "recov": [17, 18, 19, 22, 23], "red": 10, "refactor": [3, 13, 14, 15], "refer": 45, "registr": 45, "registri": 45, "reinforc": [2, 4, 9, 10, 38, 40, 41, 42, 44], "relax": [2, 38, 41], "releas": [16, 37], 
"reli": 44, "reliabl": [38, 40, 41], "remov": [27, 28, 29, 30], "remove_move_penalti": [27, 28, 29, 30], "renam": 44, "render": [13, 14, 15, 37, 45], "render_mod": [13, 14, 15, 37], "repeat": [13, 14, 15], "repositori": [38, 39, 41, 45], "repres": 44, "request": 40, "requir": 1, "research": [38, 40, 41], "reservoir": [3, 16, 44], "reset": [41, 42, 44, 45], "resourc": [12, 44], "restelli": 37, "retriev": [13, 14, 15], "return": [9, 13, 14, 15, 36, 41, 44, 45, 46], "revamp": 44, "revers": [4, 5, 27, 28, 29, 30], "reverse_penalti": 5, "reward": [5, 21, 41, 42, 44, 45, 46], "reward_dim": 45, "reward_spac": [44, 45], "reymond": [3, 37], "rgb": [13, 14], "rgb_arrai": [13, 14, 15, 37], "right": [4, 6, 7, 8, 10, 11, 13, 14, 15, 20, 36], "right_lan": 16, "rightest": 16, "riva": 37, "rl": 44, "robert": 4, "rodriguez": 40, "roijer": 12, "room": [3, 12], "root": [11, 44], "run": [19, 24, 34, 45, 46], "runzheyang": 3, "safeti": 4, "same": [6, 7, 8], "sampl": 40, "save": 44, "scalar": [17, 18, 19, 22, 23, 41, 42, 44, 46], "scenario": 44, "sea": [3, 12], "second": [13, 14, 15], "section": 4, "see": [10, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 41, 42, 44, 45], "seed": 45, "select": 37, "self": [44, 45], "separ": 10, "serenevillagerevamp": [4, 36], "serial": 46, "server": [3, 41], "set": [17, 18, 22, 23, 41, 44, 45], "setup": 44, "shape": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37, 45, 46], "shaped_reward": 5, "should": [44, 45], "shown": 44, "side": [25, 26], "side_engine_fuel": 5, "signal": 5, "silva": [2, 38, 41], "similar": 35, "similarli": [5, 16], "simon": 37, "simpl": [9, 41, 42], "simpli": 3, "sin": [13, 14, 15, 32], "sinc": [45, 46], "singl": [27, 28, 29, 30, 44], "size": [4, 11, 45], "sky": 37, "small": [4, 44], "snippet": 44, "so": 4, "some": [3, 41, 43, 45], "soto": 40, "sourc": [6, 7, 8, 10, 12, 13, 14, 15, 31, 41], "space": [5, 12, 16, 21, 35, 44, 45], "spars": 
[13, 14, 15], "specifi": 4, "speed": [5, 13, 14, 15, 16, 20, 27, 28, 29, 30, 44], "speed_object": 5, "spell": 44, "sphinx": 1, "split": 10, "squar": 10, "srini": 36, "stabl": 44, "stai": 16, "standard": [41, 44], "static": 5, "steckelmach": [3, 9], "step": [4, 5, 6, 7, 8, 9, 27, 28, 29, 30, 31, 33, 37, 40, 41, 42, 44, 45], "structur": 44, "submarin": [6, 7, 8, 12], "submiss": 40, "successfulli": [25, 26], "successor": [3, 10], "suit": 41, "super": 33, "supermario": [3, 16], "supermariobro": 33, "supermariobrosenv": 16, "suppli": 37, "support": 16, "swimmer": 35, "system": [38, 41, 43], "t": 46, "tailor": 44, "take": [4, 12], "taken": 12, "talbi": [2, 38, 41], "target": 32, "target_1": 35, "target_2": 35, "target_3": 35, "target_4": 35, "target_i": 32, "taxonomi": 40, "termin": [41, 42, 44, 45], "test": 44, "than": 4, "thank": 3, "thei": [44, 46], "them": [3, 4, 5, 41, 42], "therefor": 11, "thi": [1, 4, 38, 41, 42, 43, 44, 45, 46], "those": 10, "three": 12, "threshold": 37, "thrill": 44, "through": 45, "thu": 44, "ti": 45, "time": [1, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 27, 28, 29, 30, 31, 33, 46], "time_limit": 37, "time_penalti": [4, 5, 12], "timemov": 5, "timespe": 5, "tip": 32, "titl": [2, 38, 41], "tomekst": 44, "tool": 44, "toolkit": [38, 40, 41], "top": [27, 28, 29, 30, 31], "torqu": 32, "touch": 46, "track": 46, "trade": 44, "transfer": [3, 10], "transform": 44, "travel": 10, "treasur": [3, 4, 12, 36], "tree": [3, 12, 37], "triangl": 10, "true": [4, 6, 7, 8, 13, 14, 15, 37, 46], "truncat": [37, 41, 42, 44, 45], "tuto": 44, "tutori": 45, "two": [9, 13, 14, 15, 16, 32, 33, 37], "txt": 1, "type": [12, 13, 14, 15, 16, 44], "u": 3, "unbreakable_bottl": 4, "unbreakablebottl": 4, "under": [39, 44], "underwat": [6, 7, 8], "unpin": 44, "until": 37, "unwrap": 44, "up": [4, 6, 7, 8, 10, 36, 37], "updat": 44, "upper": [13, 14, 15], "upstream": 37, "us": [6, 7, 8, 13, 14, 15, 37, 38, 39, 40, 41, 42, 43, 44, 45], "user": 44, "util": [9, 44], "v0": [3, 4, 5, 6, 7, 8, 9, 10, 
11, 12, 13, 14, 15, 16, 20, 21, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 41, 42], "v2": [5, 25, 26, 44], "v4": [17, 18, 19, 22, 23, 24, 32, 34, 35, 44], "valu": [4, 6, 7, 8, 11, 12, 40], "vamplew": [5, 12], "variou": [3, 39], "vecenv": 44, "vector": [10, 11, 13, 14, 15, 27, 28, 29, 30, 31, 33, 41, 44, 45, 46], "vector_reward": [41, 42, 44], "vectori": 44, "vehicl": 16, "veloc": [17, 18, 24, 32, 34, 35], "veri": [41, 42, 45], "version": [5, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 44], "via": 40, "vitamin": [11, 12], "wa": [3, 4, 5, 6, 7, 8, 13, 14, 15, 40, 44], "wai": [3, 10], "walker2d": 35, "walker2denv": 34, "wall": 10, "want": 3, "warn": [16, 44], "water": [3, 11, 12, 16, 44], "we": [3, 41, 44, 45], "websit": [41, 44], "weight": [17, 18, 19, 22, 23, 41, 42, 44, 46], "welfar": 40, "well": [41, 44, 45], "were": 10, "when": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 33, 36, 44, 45], "where": [6, 7, 8, 9, 11, 27, 28, 29, 30, 31, 44], "whether": [13, 14, 15, 37], "which": [4, 5, 6, 7, 8, 9, 10, 41, 44, 45, 46], "while": [4, 10, 12, 16], "within": [44, 45], "wood": [9, 12], "wood_amount": 12, "woodproba": 9, "work": 41, "worker": 44, "workshop": [2, 40], "world": [6, 7, 8], "would": 3, "wrap": [44, 46], "wrapper": [39, 41, 42, 44], "wrt": 37, "x": [6, 7, 8, 17, 18, 22, 23, 24, 33, 34, 36], "x_po": 16, "x_veloc": [35, 44], "xu": 35, "y": [6, 7, 8, 17, 18, 36], "y_veloc": 35, "yang": [6, 7, 8, 11, 12, 16], "year": [2, 38, 41], "you": [3, 38, 41, 42, 43, 44, 45], "your": [1, 38, 41], "your_ag": [41, 42, 44], "z": [22, 23], "zero": [32, 44]}, "titles": ["404 - Page Not Found", "MO-Gymnasium documentation", "<no title>", "Community", "Breakable-Bottles", "Classic Control", "Deep-Sea-Treasure", "Deep-Sea-Treasure-Concave", "Deep-Sea-Treasure-Mirrored", "Fishwood", "Four-Room", "Fruit-Tree", "Grid-World", "Minecart", "Minecart-Deterministic", "Minecart-Rgb", "Miscellaneous", "MO-Ant", "MO-Ant-2D", "MO-Halfcheetah", "MO-Highway", 
"MO-Highway-Fast", "MO-Hopper", "MO-Hopper-2D", "MO-Humanoid", "MO-Lunar-Lander", "MO-Lunar-Lander-Continuous", "MO-Mountaincar", "MO-Mountaincar-3D", "MO-Mountaincar-Timemove", "MO-Mountaincar-Timespeed", "MO-Mountaincarcontinuous", "MO-Reacher", "MO-Supermario", "MO-Walker2D", "MuJoCo", "Resource-Gathering", "Water-Reservoir", "Citation", "MORL Baselines", "List of Publications", "API", "API", "Install", "Release Notes", "Creating a custom environment", "Wrappers"], "titleterms": {"0": 44, "1": [44, 45], "2": [44, 45], "29": 44, "2d": [18, 23], "3": [44, 45], "3d": 28, "4": [44, 45], "404": 0, "Not": 0, "The": 0, "acknowledg": 3, "action": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 32, 36, 37], "ant": [17, 18], "api": [41, 42], "argument": [4, 6, 7, 8, 9, 10, 13, 14, 15, 37], "baselin": 39, "becom": 44, "better": 44, "bottl": [4, 44], "breakabl": [4, 44], "bug": 44, "build": 1, "citat": 38, "cite": 41, "class": 45, "classic": 5, "commun": 3, "concav": 7, "continu": 26, "control": 5, "could": 0, "creat": 45, "credit": [4, 6, 7, 8, 9, 10, 13, 14, 15, 36, 37], "custom": 45, "deep": [6, 7, 8, 44], "descript": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 32, 33, 34, 36, 37], "determinist": 14, "document": [1, 44], "environ": [44, 45], "episod": [4, 6, 7, 8, 10, 11, 13, 14, 15, 33, 36], "evalu": 44, "fast": 21, "fishwood": 9, "fix": 44, "found": 0, "four": 10, "front": 44, "fruit": [11, 44], "gather": 36, "grid": 12, "gymnasium": [1, 44], "halfcheetah": 19, "highwai": [20, 21], "hopper": [22, 23], "humanoid": 24, "improv": 44, "instal": [41, 43], "instanti": 45, "known": 44, "lander": [25, 26], "linearreward": 46, "list": 40, "lunar": [25, 26], "matur": 44, "migrat": 44, "minecart": [13, 14, 15], "mirror": [8, 44], "miscellan": 16, "mo": [1, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 44], "moclipreward": 46, "monormalizereward": 46, "more": 44, "morecordepisodestatist": 46, "morl": 39, "mosyncvectorenv": 46, 
"mountaincar": [27, 28, 29, 30], "mountaincarcontinu": 31, "mujoco": [35, 44], "new": [44, 45], "note": 44, "observ": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 32, 36, 37], "page": [0, 44], "pareto": 44, "polici": 44, "public": 40, "pygam": 44, "reacher": [32, 44], "refer": 10, "regist": 45, "releas": 44, "render": 44, "request": 0, "reservoir": 37, "resourc": 36, "reward": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37], "rgb": 15, "room": 10, "sea": [6, 7, 8, 44], "space": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 36, 37], "start": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 36, 37], "state": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 36, 37], "supermario": 33, "support": 44, "termin": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 33, 36], "test": 45, "timemov": 29, "timespe": 30, "treasur": [6, 7, 8, 44], "tree": [11, 44], "v0": 44, "v1": 44, "walker2d": 34, "water": 37, "webpag": 44, "world": 12, "wrapper": 46, "your": 45}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.1.1": [[45, "release-0-1-1"]], "0.1.2": [[45, "release-0-1-2"]], "0.2.0": [[45, "release-0-2-0"]], "0.2.1": [[45, "release-0-2-1"]], "1. Create a new environment class": [[46, "create-a-new-environment-class"]], "2. Register the environment": [[46, "register-the-environment"]], "3. Test the environment": [[46, "test-the-environment"]], "4. 
Instantiate your environment": [[46, "instantiate-your-environment"]], "404 - Page Not Found": [[0, null]], "API": [[42, null], [43, null]], "Acknowledgements": [[3, "acknowledgements"]], "Action Space": [[4, "action-space"], [6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [13, "action-space"], [14, "action-space"], [15, "action-space"], [32, "action-space"], [37, "action-space"], [38, "action-space"]], "Arguments": [[4, "arguments"], [6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [13, "arguments"], [14, "arguments"], [15, "arguments"], [38, "arguments"]], "Breakable-Bottles": [[4, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Citation": [[39, null]], "Citing": [[42, "citing"]], "Classic Control": [[5, null]], "Community": [[3, null]], "Creating a custom environment": [[46, null]], "Credits": [[4, "credits"], [6, "credits"], [7, "credits"], [8, "credits"], [9, "credits"], [10, "credits"], [13, "credits"], [14, "credits"], [15, "credits"], [37, "credits"], [38, "credits"]], "Deep-Sea-Treasure": [[6, null]], "Deep-Sea-Treasure-Concave": [[7, null]], "Deep-Sea-Treasure-Mirrored": [[8, null]], "Description": [[4, "description"], [6, "description"], [7, "description"], [8, "description"], [9, "description"], [10, "description"], [11, "description"], [13, "description"], [14, "description"], [15, "description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [37, "description"], [38, "description"]], "Episode Termination": [[4, "episode-termination"], [6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [11, "episode-termination"], [13, 
"episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [33, "episode-termination"], [37, "episode-termination"]], "Fishwood": [[9, null]], "Four-Room": [[10, null]], "Fruit-Tree": [[11, null]], "Grid-World": [[12, null]], "Install": [[42, "install"], [44, null]], "LinearReward": [[48, "linearreward"]], "List of Publications": [[41, null]], "MO-Ant": [[17, null]], "MO-Ant-2D": [[18, null]], "MO-Gymnasium 0.3.0 Release: Migrate to Gymnasium": [[45, "release-0-3-0"]], "MO-Gymnasium 0.3.1 Release: Improved documentation and MuJoco MO-Reacher environment": [[45, "release-0-3-1"]], "MO-Gymnasium 0.3.2 Release: Bug fixes, improved webpage": [[45, "release-0-3-2"]], "MO-Gymnasium documentation": [[1, null]], "MO-Halfcheetah": [[19, null]], "MO-Highway": [[20, null]], "MO-Highway-Fast": [[21, null]], "MO-Hopper": [[22, null]], "MO-Hopper-2D": [[23, null]], "MO-Humanoid": [[24, null]], "MO-Lunar-Lander": [[25, null]], "MO-Lunar-Lander-Continuous": [[26, null]], "MO-Mountaincar": [[27, null]], "MO-Mountaincar-3D": [[28, null]], "MO-Mountaincar-Timemove": [[29, null]], "MO-Mountaincar-Timespeed": [[30, null]], "MO-Mountaincarcontinuous": [[31, null]], "MO-Reacher": [[32, null]], "MO-Supermario": [[33, null]], "MO-Swimmer": [[34, null]], "MO-Walker2D": [[35, null]], "MOClipReward": [[48, "moclipreward"]], "MOMaxAndSkipObservation": [[48, "momaxandskipobservation"]], "MONormalizeReward": [[48, "monormalizereward"]], "MORL Baselines": [[40, null]], "MORecordEpisodeStatistics": [[47, "morecordepisodestatistics"], [48, "morecordepisodestatistics"]], "MOSyncVectorEnv": [[47, "mosyncvectorenv"]], "Minecart": [[13, null]], "Minecart-Deterministic": [[14, null]], "Minecart-Rgb": [[15, null]], "Miscellaneous": [[16, null]], "MuJoCo": [[36, null]], "Observation Space": [[4, "observation-space"], [6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [13, 
"observation-space"], [14, "observation-space"], [15, "observation-space"], [32, "observation-space"], [37, "observation-space"], [38, "observation-space"]], "References": [[10, "references"]], "Release Notes": [[45, null]], "Resource-Gathering": [[37, null]], "Reward Space": [[4, "reward-space"], [6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [9, "reward-space"], [10, "reward-space"], [11, "reward-space"], [13, "reward-space"], [14, "reward-space"], [15, "reward-space"], [17, "reward-space"], [18, "reward-space"], [19, "reward-space"], [20, "reward-space"], [22, "reward-space"], [23, "reward-space"], [24, "reward-space"], [25, "reward-space"], [26, "reward-space"], [32, "reward-space"], [33, "reward-space"], [34, "reward-space"], [35, "reward-space"], [37, "reward-space"], [38, "reward-space"]], "Reward space:": [[27, "reward-space"], [28, "reward-space"], [29, "reward-space"], [30, "reward-space"], [31, "reward-space"]], "Starting State": [[4, "starting-state"], [6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [13, "starting-state"], [14, "starting-state"], [15, "starting-state"], [37, "starting-state"], [38, "starting-state"]], "Termination": [[9, "termination"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Vector Wrappers": [[47, null]], "Water-Reservoir": [[38, null]], "Wrappers": [[48, null]], "v0.3.3: MO-Gymnasium 0.3.3 Release: Policy Evaluation bug fix, better documentation page": [[45, "release-v0-3-3"]], "v0.3.4: MO-Gymnasium 0.3.4 Release: Known Pareto Front, improved renders and documentation": [[45, "release-v0-3-4"]], "v1.0.0: MO-Gymnasium becomes mature": [[45, "release-v1-0-0"]], "v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more": [[45, "release-v1-0-1"]], "v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, 
Fruit Tree rendering, and more": [[45, "release-v1-1-0"]]}, "docnames": ["404", "README", "citing/citing", "community/community", "environments/breakable-bottles", "environments/classical", "environments/deep-sea-treasure", "environments/deep-sea-treasure-concave", "environments/deep-sea-treasure-mirrored", "environments/fishwood", "environments/four-room", "environments/fruit-tree", "environments/grid-world", "environments/minecart", "environments/minecart-deterministic", "environments/minecart-rgb", "environments/misc", "environments/mo-ant", "environments/mo-ant-2d", "environments/mo-halfcheetah", "environments/mo-highway", "environments/mo-highway-fast", "environments/mo-hopper", "environments/mo-hopper-2d", "environments/mo-humanoid", "environments/mo-lunar-lander", "environments/mo-lunar-lander-continuous", "environments/mo-mountaincar", "environments/mo-mountaincar-3d", "environments/mo-mountaincar-timemove", "environments/mo-mountaincar-timespeed", "environments/mo-mountaincarcontinuous", "environments/mo-reacher", "environments/mo-supermario", "environments/mo-swimmer", "environments/mo-walker2d", "environments/mujoco", "environments/resource-gathering", "environments/water-reservoir", "examples/citation", "examples/morl_baselines", "examples/publications", "index", "introduction/api", "introduction/install", "release_notes", "tutorials/custom_env", "wrappers/vector_wrappers", "wrappers/wrappers"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["404.md", "README.md", "citing/citing.md", "community/community.md", "environments/breakable-bottles.md", "environments/classical.md", "environments/deep-sea-treasure.md", "environments/deep-sea-treasure-concave.md", 
"environments/deep-sea-treasure-mirrored.md", "environments/fishwood.md", "environments/four-room.md", "environments/fruit-tree.md", "environments/grid-world.md", "environments/minecart.md", "environments/minecart-deterministic.md", "environments/minecart-rgb.md", "environments/misc.md", "environments/mo-ant.md", "environments/mo-ant-2d.md", "environments/mo-halfcheetah.md", "environments/mo-highway.md", "environments/mo-highway-fast.md", "environments/mo-hopper.md", "environments/mo-hopper-2d.md", "environments/mo-humanoid.md", "environments/mo-lunar-lander.md", "environments/mo-lunar-lander-continuous.md", "environments/mo-mountaincar.md", "environments/mo-mountaincar-3d.md", "environments/mo-mountaincar-timemove.md", "environments/mo-mountaincar-timespeed.md", "environments/mo-mountaincarcontinuous.md", "environments/mo-reacher.md", "environments/mo-supermario.md", "environments/mo-swimmer.md", "environments/mo-walker2d.md", "environments/mujoco.md", "environments/resource-gathering.md", "environments/water-reservoir.md", "examples/citation.md", "examples/morl_baselines.md", "examples/publications.md", "index.md", "introduction/api.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "wrappers/vector_wrappers.md", "wrappers/wrappers.md"], "indexentries": {"linearreward (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.LinearReward", false]], "moclipreward (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MOClipReward", false]], "momaxandskipobservation (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MOMaxAndSkipObservation", false]], "monormalizereward (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MONormalizeReward", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MORecordEpisodeStatistics", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers.vector)": [[47, 
"mo_gymnasium.wrappers.vector.MORecordEpisodeStatistics", false]], "mosyncvectorenv (class in mo_gymnasium.wrappers.vector)": [[47, "mo_gymnasium.wrappers.vector.MOSyncVectorEnv", false]]}, "objects": {"mo_gymnasium.wrappers": [[48, 0, 1, "", "LinearReward"], [48, 0, 1, "", "MOClipReward"], [48, 0, 1, "", "MOMaxAndSkipObservation"], [48, 0, 1, "", "MONormalizeReward"], [48, 0, 1, "", "MORecordEpisodeStatistics"]], "mo_gymnasium.wrappers.vector": [[47, 0, 1, "", "MORecordEpisodeStatistics"], [47, 0, 1, "", "MOSyncVectorEnv"]]}, "objnames": {"0": ["py", "class", "Python class"]}, "objtypes": {"0": "py:class"}, "terms": {"": [4, 5, 6, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 42, 43, 48], "0": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 47, 48], "01": 45, "02": 45, "03": 45, "06": 45, "07": [27, 28, 29, 30, 31], "08": [45, 48], "09": 45, "1": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 47, 48], "10": [6, 7, 8, 11, 12, 25, 26, 37, 38], "100": [25, 26, 33, 47, 48], "11": [6, 7, 22, 23, 45], "1109": 38, "1145": 37, "12": 45, "124": [7, 8], "13": [10, 45], "1390156": 37, "1390162": 37, "14": [10, 45], "16": 45, "160": 38, "17": [19, 24, 35], "18": 45, "19": 45, "1e": [34, 48], "2": [4, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 47], "20": [8, 45], "200": 9, "2008": [12, 37], "2010": 12, "2011": 5, "2012": 38, "2013": 16, "2017": 10, "2018": 12, "2019": [6, 7, 8, 11, 12, 13, 14, 15, 16], "2020": 36, "2021": 12, "2022": [2, 5, 12, 41, 45], "2022bnaic": 2, "2023": [39, 41, 42, 45], "2024": [41, 45], "21": 45, "23": [6, 45], "24": 45, "240": [4, 33], "25": [33, 45], "255": [15, 33], "256": 33, "25th": 37, "26": 45, "27": [17, 18, 45], "28": [25, 26], "2d": [6, 7, 8, 10, 13, 14, 15, 31, 45, 47], "3": [4, 6, 
7, 8, 10, 13, 14, 15, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32, 33, 37, 38, 47], "30": 45, "31": 45, "33": 45, "34": 45, "34th": 2, "35": 45, "360": 4, "37": 45, "376": 24, "37th": [39, 42], "3d": [5, 13, 14, 15, 27, 29, 30], "4": [4, 6, 7, 8, 10, 13, 14, 15, 24, 25, 26, 32, 33, 34, 37, 38, 47, 48], "40": 45, "41": [37, 45], "42": [45, 47], "43": 45, "45": 45, "46": 45, "47": [37, 45], "480": 15, "5": [4, 11, 12, 13, 14, 15, 20, 21, 25, 26, 33, 37, 45], "50": [4, 45], "51": 45, "52": 45, "53": 45, "55": 45, "56": 45, "57": 45, "58": 45, "59": 45, "6": [11, 12, 13, 14, 15, 19, 25, 26, 27, 28, 29, 30, 31, 32, 35], "60": 45, "61": 45, "62": 45, "6252759": 38, "63": 11, "64": 45, "65": 45, "67": 45, "69": 45, "7": [6, 11, 12, 13, 14, 15, 45, 47], "70": 45, "72": 45, "73": 45, "74": 45, "75": 45, "76": 45, "77": 45, "79": 45, "8": [17, 18, 25, 26, 34, 38, 42, 43, 45], "80": 45, "81": 45, "83": 45, "84": 45, "86": 45, "87": 45, "9": 32, "99": 48, "A": [2, 4, 10, 16, 17, 18, 21, 27, 28, 29, 30, 31, 38, 39, 41, 42, 43, 48], "As": [4, 42, 43], "At": 47, "But": 48, "By": [27, 28, 29, 30, 38], "For": [1, 32, 42, 43, 45, 47], "If": [3, 13, 14, 15, 17, 18, 22, 23, 38, 39, 42, 46], "In": [4, 45], "It": [40, 42, 43, 45, 46], "Of": 45, "The": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 31, 32, 33, 34, 35, 37, 38, 42, 45, 46, 47], "There": 38, "To": [1, 6, 7, 8, 42, 44], "With": 45, "_": 47, "__init__": 46, "_build": 1, "_episod": 47, "_forward_reward_weight": 45, "_modul": 48, "aama": 41, "abel": [13, 14, 15, 16], "about": [1, 5], "abov": 4, "acceler": [13, 14, 15], "accept": 45, "access": [45, 47], "account": [4, 12], "achiev": 45, "act": [42, 43, 45], "action": [5, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 45, 46, 47], "action_spac": [46, 47], "acttyp": 48, "ad": [17, 18, 22, 23, 46, 47], "adapt": [6, 7, 8, 10], "add": [27, 28, 29, 30, 41, 45], "add_speed_object": [27, 28, 29, 30], 
"addit": 5, "addition": 45, "after": [9, 45, 48], "again": 4, "agent": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 37, 38, 45], "ai": 4, "al": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 36, 41], "alegr": [2, 12, 39, 41, 42], "algorithm": [40, 42], "align": 41, "all": [3, 17, 18, 37, 42, 44, 45, 47, 48], "allow": 45, "also": [3, 16, 42, 43, 45], "altern": [27, 28, 29, 30], "alwai": [6, 7, 8], "amount": [16, 38], "an": [5, 10, 27, 28, 29, 30, 33, 37, 38, 42, 43, 45, 46, 48], "ana": [2, 39, 42], "andrea": 45, "andr\u00e9": 10, "angl": 32, "angular": 32, "ani": 47, "ann": [2, 39, 42], "ansi": 38, "ansimuz": [6, 7, 8], "ant": 36, "antenv": [17, 18], "api": [40, 45, 46], "appear": 2, "appli": [4, 32, 47], "approach": 4, "approxim": 41, "ar": [3, 4, 13, 14, 15, 16, 37, 38, 45, 46, 47, 48], "arm": 32, "arrai": [10, 17, 18, 19, 22, 23, 34, 42, 43, 45, 46, 47, 48], "art": [4, 6, 7, 8, 45], "artifici": 2, "asid": 3, "ask": 3, "asset": [4, 37, 45], "assist": [4, 6, 7, 8], "atari_wrapp": 48, "attribut": 46, "australia": 38, "author": [2, 39, 42], "autobuild": 1, "automat": [1, 45, 46], "avail": [45, 47, 48], "averag": 48, "avoid": [10, 16], "axel": [13, 14, 15], "axelabel": 3, "axi": [22, 23], "b": 1, "back": 45, "background": [6, 7, 8, 38], "backward": 5, "balanc": 45, "barret": 12, "barreto": 10, "barrett": 37, "base": [3, 4, 13, 14, 15, 32, 36, 38, 41, 45, 48], "baselin": 45, "baselines3": 48, "batteri": 45, "bazzan": [2, 39, 42], "becaus": 4, "been": [4, 5, 45], "befor": 47, "begin": [47, 48], "behind": 5, "benchmark": [39, 41, 42], "benefit": 45, "benelearn": 2, "benelux": 2, "between": [33, 38, 42, 45, 48], "bib": 45, "binari": [10, 11, 12], "blob": [13, 14, 15], "blue": 10, "bnaic": [2, 41], "bnj6kubtg6": 42, "booktitl": [2, 39, 42], "bool": 47, "boolean": [4, 47], "both": 48, "both_norm_env": 48, "bottl": 12, "bottle_reward": 4, "bottles_carri": 4, "bottles_deliv": [4, 12], "bottles_drop": 4, "bound": [38, 45], "box": [6, 7, 8, 17, 18, 19, 22, 23, 24, 26, 31, 34, 35, 
38], "brake": [13, 14, 15], "break": 45, "breakabl": 12, "breakablebottl": 4, "brisban": 38, "bro": 33, "bruno": [2, 39, 42], "budget": 41, "buffer": 47, "buffer_length": [47, 48], "bugfix": 45, "bump": 45, "button": 45, "c": [2, 39, 42], "cai": 41, "calcul": 4, "call": 45, "callabl": 47, "can": [3, 4, 9, 11, 13, 14, 15, 27, 28, 29, 30, 38, 42, 43, 44, 45, 47, 48], "cannot": 4, "capabl": 45, "capac": [13, 14, 15], "car": [5, 27, 28, 29, 30, 45], "carb": [11, 12], "care": 47, "carri": 4, "cart": [13, 14, 15], "castelletti": 38, "catch": 9, "caus": 45, "cc": 45, "cd": 1, "cell": 12, "central": 32, "certain": [42, 44], "chanc": 12, "chang": [1, 6, 7, 8, 27, 28, 29, 30, 45], "changelog": 45, "check": [42, 43], "chose": 11, "ci": 45, "circl": 10, "citat": 45, "cite": 39, "class": [5, 42, 43, 47, 48], "classic": [6, 7, 8, 46], "clip": 48, "close": 46, "co": [13, 14, 15, 32], "code": [3, 6, 7, 8, 9, 10, 13, 14, 15, 38, 45, 48], "coin": [16, 33], "colab": [42, 43], "collect": [9, 10, 11, 12, 13, 14, 15, 16, 33, 37, 45], "collis": [16, 20], "com": [3, 13, 14, 15], "combin": 45, "commit": 45, "common": 48, "commun": [42, 45], "compar": 42, "complet": 48, "compliant": 42, "compon": [10, 45, 48], "compromis": 45, "comput": [32, 45, 46], "concav": [12, 45], "concave_map": [6, 7, 8], "conduct": 45, "confer": [2, 37, 38, 39, 42], "config": [13, 14, 15], "configur": [13, 14, 15], "conflict": 45, "conor": 3, "consequ": 45, "consist": 37, "constructor": 46, "consum": [13, 14, 15], "consumpt": [5, 13, 14, 15, 16], "contain": [1, 4, 10, 11, 12, 13, 14, 15, 27, 28, 29, 30, 31, 32, 40], "content": 38, "context": 45, "continu": [5, 6, 7, 8, 16, 31, 36, 38, 45], "contribut": [1, 3, 4, 45], "contributor": [3, 45], "control": [6, 7, 8, 9, 17, 18, 19, 22, 23, 24, 34, 35], "control_cost": 45, "converg": 5, "convers": 45, "convex": [6, 7, 8], "coordin": [6, 7, 8, 37, 42], "copi": 47, "corner": [13, 14, 15], "correspond": [16, 27, 28, 29, 30, 38], "cost": [17, 18, 19, 22, 23, 24, 25, 26, 34, 
35, 38], "cost_flood": 16, "cost_object": [17, 18, 22, 23], "crash": [25, 26], "creat": [4, 6, 7, 8, 42, 43, 45], "creation": 45, "criteria": 37, "ctrl_cost": 45, "cumul": [47, 48], "current": [4, 6, 7, 8, 38], "custom": 45, "d": [11, 12, 41], "da": [2, 39, 42], "dall": [4, 6, 7, 8], "dam": [16, 38], "danoi": [2, 39, 42], "deal": 46, "death": 16, "decis": 38, "decomposit": 41, "deep": [3, 12, 47, 48], "deep_sea_treasur": 45, "deepseatreasur": [6, 7, 8], "default": [6, 7, 8, 13, 14, 15, 27, 28, 29, 30, 38], "deficit": 38, "deficit_wat": 16, "defin": [4, 5, 16, 32, 46], "definit": [42, 43], "deliv": [4, 12], "demand": 38, "deni": [3, 9], "dens": [13, 14, 15], "depend": [42, 44], "deprec": 45, "depth": [11, 12], "deque_s": 47, "descript": [5, 12, 16, 36], "design": [45, 47], "desir": 45, "destin": 12, "detail": [5, 42, 43], "determin": 45, "determinist": 45, "develop": 42, "deviat": 48, "di": 33, "diamond": 37, "dict": 4, "dictionari": [4, 12], "did": 4, "differ": [4, 12], "dim_reward": 47, "dimens": [4, 45], "dimension": [6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 32, 33, 34, 35, 37], "directli": [45, 47, 48], "directori": 46, "dirhtml": 1, "discord": [3, 42], "discount": [46, 47, 48], "discret": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 21, 25, 27, 28, 29, 30, 32, 33, 36, 37, 45], "dissert": 5, "distanc": [32, 46], "distinct": 45, "distribut": 41, "do": 45, "doc": [1, 45], "document": [42, 46], "doe": [42, 44, 48], "doi": 38, "domain": 45, "done": [46, 47], "dot": 48, "down": [6, 7, 8, 10, 37], "downstream": 38, "dr": [47, 48], "drop": [4, 45], "dst": [12, 45], "dst_map": [6, 7, 8], "dtype": [45, 47], "due": [5, 38], "dynmorl": 3, "e": [1, 2, 4, 6, 7, 8, 12, 31, 39, 42, 45], "each": [4, 6, 7, 8, 11, 13, 14, 15, 27, 28, 29, 30, 31, 32, 45, 47], "eat": 12, "edit": 45, "effici": 41, "either": 9, "el": [2, 39, 42], "elaps": [47, 48], "elbow": 32, "element": [37, 45], "els": [10, 33, 37], "en": 48, "enabl": 45, "end": [9, 13, 14, 15, 
47], "enemi": [4, 12, 16, 33, 37], "energi": 36, "engin": [25, 26], "entri": 41, "entry_point": 46, "env": [3, 5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 36, 42, 43, 45, 46, 47, 48], "env_fn": 47, "environ": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 44, 47], "episod": [9, 38, 47, 48], "epsilon": 48, "equival": 5, "esr": [12, 45], "essenti": [42, 46], "et": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 36, 41], "eval_mo": 45, "everi": [1, 11, 12, 48], "exampl": [10, 40, 42, 43, 45, 47, 48], "except": 48, "excess": 38, "execut": [16, 38], "exhaust": 45, "expand": 45, "expect": 9, "extend": 45, "extra": [5, 27, 28, 29, 30], "extract": 48, "ezpickl": 45, "f": [3, 38], "fair": 41, "fall": 45, "fals": [17, 18, 22, 23, 47], "famili": [42, 44], "fan": 41, "fantasi": [6, 7, 8], "far": 33, "farama": [3, 13, 14, 15, 42, 45], "fast": [16, 45], "fat": [11, 12], "featur": [3, 10, 45], "feder": 41, "felten": [2, 12, 39, 41, 42], "felten_toolkit_2023": [39, 42], "few": [45, 47, 48], "ffelten": 45, "file": [13, 14, 15, 45, 46], "fill": [13, 14, 15], "finger_tip_coord": 32, "fire": 12, "first": [2, 13, 14, 15, 38, 41, 45, 47], "fish": [9, 12], "fish_amount": 12, "fisherman": 9, "fishproba": 9, "fishwood": [3, 12, 45], "fit": 38, "fix": 10, "flag": [4, 17, 18, 22, 23, 33, 37, 46], "flexibl": 45, "float": [38, 46, 47, 48], "float32": [17, 18, 19, 22, 23, 24, 26, 31, 34, 35, 38, 47], "float_stat": [6, 7, 8], "flood": 38, "florian": [2, 39, 42], "folder": 1, "follow": [2, 10, 13, 14, 15, 17, 18, 19, 22, 23, 27, 28, 29, 30, 34, 42, 43, 45, 46], "fork": 1, "form": 47, "formerli": [2, 41], "forward": [5, 19, 22, 23, 24, 27, 28, 29, 30, 34, 35], "forward_penalti": 5, "forward_reward": 45, "foundat": [13, 14, 15, 45], "four": [3, 12, 32], "frame": 48, "frame_skip": [13, 14, 15], "frameskip": 48, "framework": 41, "from": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 
14, 15, 16, 37, 38, 45, 46, 47, 48], "front": 46, "fruit": [3, 12], "fruit_tre": 45, "fuel": [5, 13, 14, 15, 16, 25, 26, 31], "fuel_consumption_penalti": 5, "full": [11, 12, 45], "function": [42, 43, 45], "g": [10, 12, 45], "gamma": [46, 47, 48], "gather": [12, 45], "gem": [4, 12, 37], "gener": [41, 45, 46], "get": 45, "gg": 42, "ghazali": [2, 39, 42], "gif": 45, "gimelfarb": [3, 10], "github": [3, 13, 14, 15, 45], "give": 5, "given": 48, "go": [1, 9, 11, 22, 23, 27, 28, 29, 30], "goal": [10, 12, 27, 28, 29, 30, 31], "goe": 46, "goir": [2, 39, 42], "gold": [4, 12, 37], "gr": [2, 39, 42], "green": 10, "grid": [6, 7, 8], "gridworld": [10, 12], "ground": 4, "group": 45, "gt": 45, "guarante": 41, "guid": [42, 43], "gupta": 5, "gym": [2, 33, 41, 42, 43, 45], "gymnasium": [2, 5, 13, 14, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 40, 41, 42, 43, 44, 46, 47, 48], "ha": [4, 5, 33, 45, 47], "halfcheetah": [36, 45], "halfcheetahenv": 19, "harder": 12, "hartmann": 41, "have": [3, 4, 5, 12, 42, 45, 48], "hay": 3, "healthi": [17, 18], "heavili": 48, "height": 36, "help": 3, "here": [3, 10, 42, 43, 45], "high": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 45], "higher": 45, "highwai": [16, 45], "highwayenv": 20, "highwayfastenv": 21, "home": [4, 37], "hopper": [36, 45], "hopperenv": [22, 23], "hotfix": 45, "how": [1, 13, 14, 15, 33, 40], "html": 48, "http": [3, 4, 6, 7, 8, 13, 14, 15, 37, 38, 42, 48], "human": [13, 14, 15, 38], "humanoid": 36, "humanoidenv": 24, "humonoid": 36, "hung": 5, "hydroelectr": 38, "hyperparamet": 41, "i": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 40, 42, 43, 45, 46, 47, 48], "ianleongudri": 45, "id": 46, "idx": 48, "igd": 46, "ijcnn": 38, "illustr": 45, "imag": [13, 14, 15, 16, 38], "image_observ": [13, 14, 15], "impact": 4, "implement": [4, 40, 46], "import": [4, 6, 
7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 45, 46, 47, 48], "improv": 41, "includ": [16, 42, 44], "increment": [13, 14, 15], "incremental_frame_skip": [13, 14, 15], "index": [47, 48], "indic": [4, 10, 37, 45, 47], "inf": [4, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 32, 33, 34, 35, 38], "info": [42, 43, 45, 46, 47, 48], "info_dict": 45, "inform": [1, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 39, 42], "inher": 45, "inherit": 46, "init": 45, "initi": [38, 46], "initial_st": 38, "inproceed": [2, 39, 42], "inspir": 48, "instal": 1, "instanc": [42, 43, 45], "instead": [4, 45], "int": [47, 48], "int32": 47, "integ": 46, "integr": 45, "intellig": 2, "interact": [42, 43], "intern": [37, 38], "introduc": [5, 10, 45], "invert": 46, "io": [4, 6, 7, 8, 37, 48], "itch": [4, 6, 7, 8, 37], "item": [10, 12], "item1": 12, "item2": 12, "item3": 12, "iter": [38, 47], "its": 46, "ivanov": 41, "join": [3, 42], "joint": [32, 38], "json": [13, 14, 15], "jump": [22, 23], "kallinteri": 45, "keep": [47, 48], "kei": [4, 47], "kill": [12, 33, 37], "klassert": 4, "known": 46, "kwarg": 46, "l": [2, 39, 42, 47, 48], "lack": 5, "lambda": 47, "land": [5, 25, 26], "lander": [5, 45], "lane": [16, 20], "larger": 4, "last": [47, 48], "leaf": [11, 12], "learn": [2, 4, 9, 10, 37, 39, 41, 42, 43, 45], "left": [4, 6, 7, 8, 10, 11, 13, 14, 15, 37], "length": [47, 48], "length_queu": 47, "leon": 37, "level": [38, 45], "leverag": 41, "librari": [2, 41, 42, 45], "life": 45, "light": 12, "like": [3, 42, 44, 48], "limezu": [4, 37], "limit": 16, "line": 46, "linear": [17, 18, 19, 22, 23, 34], "linearli": 45, "linearreward": [17, 18, 19, 22, 23, 34, 42, 43, 45], "linearwrapp": 45, "link": 45, "lint": 45, "list": [4, 45], "literatur": 45, "local": 5, "locat": [4, 12, 32], "logo": 45, "look": 48, "low": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 
33, 34, 35, 37, 38], "lower": 10, "luca": [2, 39, 42], "lucasalegr": 45, "lunar": [5, 45], "lunarland": [5, 25, 26], "m": 38, "machin": 37, "made": [1, 45], "mai": 45, "main": [3, 13, 14, 15, 25, 26], "main_engine_fuel": 5, "make": [1, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 45, 46, 47, 48], "mani": [13, 14, 15, 47], "map": [6, 7, 8, 10, 12, 13, 14, 15], "mario": [33, 45], "mark": 45, "markov": 38, "master": 48, "mathieu": [3, 38], "max": 48, "max_r": 48, "max_t": 9, "maxandskipenv": 48, "maxima": 5, "maximum": 38, "maze": 10, "md": [1, 45], "mdp": [42, 43, 45], "mean": 48, "merg": [5, 27, 28, 29, 30], "merge_move_penalti": [27, 28, 29, 30], "method": [45, 46], "metric": 46, "mgoulao": 45, "mike": [3, 10], "min": 48, "min_r": 48, "mine": [13, 14, 15], "mine_config": [13, 14, 15], "minecart": [3, 16, 42, 43, 45], "miner": [11, 12], "minerium": [13, 14, 15], "minim": [13, 14, 15, 16], "minor": 45, "mirror": 12, "mirrored_map": [6, 7, 8], "miss": [41, 45], "mistak": 45, "mo": [2, 3, 5, 13, 14, 15, 16, 36, 40, 41, 42, 43, 44, 46, 47, 48], "mo_gym": [17, 18, 19, 22, 23, 34, 42, 43, 45, 47, 48], "mo_gymnasium": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 45, 46, 47, 48], "mode": [13, 14, 15, 38], "model": [41, 42, 43], "modem": 41, "modifi": 45, "modul": [47, 48], "mofl": 41, "momaxandskipobserv": 45, "momdp": [42, 43, 45], "monormalizereward": 45, "more": [1, 5, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 42, 43], "morecordepisodestatist": 45, "moreov": [46, 47], "morewordstatist": 47, "morl": [3, 6, 7, 8, 9, 42, 43, 45], "most": 47, "mountain": [5, 27, 28, 29, 30, 31, 45], "mountaincar": [5, 31], "mountaincarcontinu": [5, 45], "move": [4, 5, 33, 34, 37, 45, 48], "move_penalti": 5, "much": 33, "mujoco": [42, 44], "multi": [2, 5, 9, 16, 17, 18, 19, 20, 21, 22, 23, 24, 
25, 26, 27, 28, 29, 30, 32, 33, 34, 35, 36, 38, 39, 41, 42, 43, 45, 46], "multibinari": 4, "multiobject": 4, "multipl": [4, 37, 40, 41, 45, 46, 47], "must": [12, 13, 14, 15, 16, 46], "my_env_dir": 46, "my_env_fil": 46, "my_env_v0": 46, "myenv": 46, "n": [2, 39, 42], "nO": 38, "narayanan": [12, 37], "ndarrai": 48, "need": 45, "neg": [10, 31, 32], "neighbour": 16, "network": 38, "neural": [38, 39, 42], "neurip": [39, 41, 42], "next": 46, "next_ob": [42, 43, 45], "ninjikin": [4, 37], "nip": 10, "node": 11, "none": [13, 14, 15, 38, 45, 48], "norm": 31, "norm_treasure_env": 48, "normal": [38, 45, 47, 48], "normalized_act": 38, "note": [4, 48], "notebook": [42, 43], "now": [2, 39, 42, 45], "np": [17, 18, 19, 22, 23, 34, 42, 43, 45], "num": 47, "num_env": 47, "number": [4, 38], "numpi": [42, 43, 45, 46], "nutri1": 12, "nutri6": 12, "nutrient": [11, 12], "ob": [5, 12, 16, 36, 42, 43, 45, 47], "object": [2, 5, 9, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33, 34, 35, 36, 38, 39, 41, 42, 43, 45, 46], "observ": [12, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 45, 46, 48], "observation_spac": 46, "observationspac": 45, "obstyp": 48, "off": 45, "oject": 46, "onc": 1, "one": [42, 44, 48], "onli": [38, 48], "open": [41, 42], "opengameart": 38, "optim": [37, 41, 45], "option": [27, 28, 29, 30, 42, 43, 45, 46], "order": 45, "ore1": 16, "ore2": 16, "ores": [13, 14, 15, 16], "org": [38, 42], "orient": [13, 14, 15], "origin": [4, 17, 18, 19, 22, 23, 34, 42, 43, 45], "other": [16, 17, 18, 22, 23, 42, 43, 45, 48], "otherwis": [4, 9, 33], "our": [1, 45, 46], "out": [3, 38], "outcom": 4, "output": 47, "packag": [1, 45], "paper": 4, "pareto": [41, 46], "pareto_front": [45, 46], "parisi": 38, "part": [45, 46], "pass": [33, 45], "passag": 10, "path": [13, 14, 15], "paulina": 38, "penal": 38, "penalti": [4, 5, 6, 7, 8, 12, 27, 28, 29, 30, 31, 33], "peopl": 3, "percentag": 38, "perform": 46, "person": 41, "pf": 45, "pianosi": [16, 38], 
"pick": 4, "pip": [1, 42, 44], "pixel": [4, 6, 7, 8, 45], "plan": [42, 43], "pleas": [39, 41, 42], "plu": 10, "point": 33, "polici": [37, 41], "porcentag": [13, 14, 15], "port": 38, "posit": [5, 6, 7, 8, 10, 13, 14, 15, 32, 33, 37], "possibl": [4, 32], "potenti": [4, 12, 45], "pp": 38, "practic": [42, 43], "pranav": 5, "pre": 45, "predefin": 45, "prefer": 45, "prevent": 5, "previous": 45, "priorit": 41, "prob_drop": 4, "probabl": [4, 9], "problem": [4, 6, 7, 8, 9, 38, 45], "problemat": [42, 44], "proceed": [2, 37, 39, 42], "process": [39, 42], "product": 48, "project": 3, "protein": [11, 12], "provid": [3, 9, 42, 45, 47], "public": [2, 42], "publish": 41, "pull": [41, 46], "py": 46, "pydoc": 45, "pypi": 45, "pytest": 46, "python": [42, 43, 45], "q": 38, "qld": 38, "qualiti": 45, "quantiti": [13, 14, 15], "question": 3, "r": [1, 47, 48], "r_i": 32, "randint": 45, "random": 38, "rang": [45, 47], "rather": 4, "reach": [3, 6, 7, 8, 10, 11, 12, 16, 27, 28, 29, 30, 31, 33, 45], "reacher": 36, "read": 5, "readm": 45, "readthedoc": 48, "reason": 5, "rebuild": 1, "receiv": [11, 45], "recent": 47, "recov": [17, 18, 19, 22, 23, 34], "red": 10, "refactor": [3, 13, 14, 15], "refer": 46, "registr": 46, "registri": 46, "reinforc": [2, 4, 9, 10, 39, 41, 42, 43, 45], "reinject": 48, "relax": [2, 39, 42], "releas": [16, 38], "reli": 45, "reliabl": [39, 41, 42], "remov": [27, 28, 29, 30], "remove_move_penalti": [27, 28, 29, 30], "renam": 45, "render": [13, 14, 15, 38, 46], "render_mod": [13, 14, 15, 38], "repeat": [13, 14, 15], "repositori": [39, 40, 42, 46], "repres": 45, "request": 41, "requir": 1, "research": [39, 41, 42], "reservoir": [3, 16, 45], "reset": [42, 43, 45, 46, 47, 48], "resourc": [12, 45], "respect": 47, "restelli": 38, "retriev": [13, 14, 15], "return": [9, 13, 14, 15, 37, 42, 45, 46, 48], "return_queu": 47, "revamp": 45, "revers": [4, 5, 27, 28, 29, 30], "reverse_penalti": 5, "reward": [5, 21, 42, 43, 45, 46, 47, 48], "reward_dim": 46, "reward_spac": [45, 46], 
"reymond": [3, 38], "rgb": [13, 14], "rgb_arrai": [13, 14, 15, 38], "right": [4, 6, 7, 8, 10, 11, 13, 14, 15, 20, 37], "right_lan": 16, "rightest": 16, "riva": 38, "rl": 45, "robert": 4, "rodriguez": 41, "roijer": 12, "room": [3, 12], "root": [11, 45], "run": [19, 24, 35, 46, 47], "runzheyang": 3, "safeti": 4, "same": [6, 7, 8], "sampl": [41, 47], "save": 45, "scalar": [17, 18, 19, 22, 23, 34, 42, 43, 45, 48], "scenario": 45, "sea": [3, 12, 47, 48], "second": [13, 14, 15], "section": 4, "see": [10, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 42, 43, 45, 46], "seed": [46, 47], "select": 38, "self": [45, 46], "sens": 48, "separ": 10, "serenevillagerevamp": [4, 37], "serial": 47, "server": [3, 42], "set": [17, 18, 22, 23, 42, 45, 46], "setup": 45, "shape": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 46, 47], "shaped_reward": 5, "should": [45, 46], "shown": 45, "side": [25, 26], "side_engine_fuel": 5, "signal": 5, "silva": [2, 39, 42], "similar": [36, 47], "similarli": [5, 16], "simon": 38, "simpl": [9, 42, 43], "simpli": 3, "sin": [13, 14, 15, 32], "sinc": [46, 47, 48], "singl": [27, 28, 29, 30, 45], "size": [4, 11, 46], "skip": 48, "sky": 38, "small": [4, 45], "smooth": 48, "snippet": 45, "so": 4, "some": [3, 42, 44, 46], "soto": 41, "sourc": [6, 7, 8, 10, 12, 13, 14, 15, 31, 42], "space": [5, 12, 16, 21, 36, 45, 46], "spars": [13, 14, 15], "specif": 47, "specifi": 4, "speed": [5, 13, 14, 15, 16, 20, 27, 28, 29, 30, 45], "speed_object": 5, "spell": 45, "sphinx": 1, "split": 10, "squar": 10, "srini": 37, "stabil": 48, "stabl": [45, 48], "stable_baselines3": 48, "stai": 16, "standard": [42, 45, 48], "static": 5, "statist": 47, "stats_kei": [47, 48], "steckelmach": [3, 9], "step": [4, 5, 6, 7, 8, 9, 27, 28, 29, 30, 31, 33, 38, 41, 42, 43, 45, 46, 47], "store": 47, "str": [47, 48], "structur": 45, "sub": 47, "submarin": [6, 7, 8, 12], "submiss": 41, 
"successfulli": [25, 26], "successor": [3, 10], "suit": 42, "super": 33, "supermario": [3, 16], "supermariobro": 33, "supermariobrosenv": 16, "suppli": 38, "support": 16, "swimmer": 36, "swimmerenv": 34, "system": [39, 42, 44], "t": [47, 48], "tailor": 45, "take": [4, 12], "taken": 12, "talbi": [2, 39, 42], "target": 32, "target_1": 36, "target_2": 36, "target_3": 36, "target_4": 36, "target_i": 32, "taxonomi": 41, "termin": [42, 43, 45, 46, 47], "test": 45, "th": 48, "than": 4, "thank": 3, "thei": [45, 47, 48], "them": [3, 4, 5, 42, 43], "therefor": 11, "thi": [1, 4, 39, 42, 43, 44, 45, 46, 47, 48], "those": 10, "three": 12, "threshold": 38, "thrill": 45, "through": 46, "thu": 45, "ti": 46, "time": [1, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 27, 28, 29, 30, 31, 33, 47, 48], "time_limit": 38, "time_penalti": [4, 5, 12], "timemov": 5, "timespe": 5, "tip": 32, "titl": [2, 39, 42], "tomekst": 45, "tool": 45, "toolkit": [39, 41, 42], "top": [27, 28, 29, 30, 31], "torqu": 32, "touch": 48, "track": [47, 48], "trade": 45, "train": 48, "transfer": [3, 10], "transform": 45, "travel": 10, "treasur": [3, 4, 12, 37, 47, 48], "tree": [3, 12, 38], "triangl": 10, "true": [4, 6, 7, 8, 13, 14, 15, 38, 47], "truncat": [38, 42, 43, 45, 46, 47], "tuto": 45, "tutori": 46, "two": [9, 13, 14, 15, 16, 32, 33, 38, 48], "txt": 1, "type": [12, 13, 14, 15, 16, 45], "u": 3, "unbreakable_bottl": 4, "unbreakablebottl": 4, "under": [40, 45], "underwat": [6, 7, 8], "unpin": 45, "until": 38, "unwrap": 45, "up": [4, 6, 7, 8, 10, 37, 38], "updat": 45, "upper": [13, 14, 15], "upstream": 38, "us": [6, 7, 8, 13, 14, 15, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48], "user": 45, "util": [9, 45], "v0": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 21, 27, 28, 29, 30, 31, 33, 36, 37, 38, 42, 43, 47, 48], "v2": [5, 45], "v3": [25, 26], "v4": [17, 18, 19, 22, 23, 24, 32, 34, 35, 36, 45], "valu": [4, 6, 7, 8, 11, 12, 41], "vamplew": [5, 12], "variabl": 47, "variou": [3, 40], "vecenv": 45, "vector": [10, 11, 
13, 14, 15, 27, 28, 29, 30, 31, 33, 42, 45, 46, 48], "vector_reward": [42, 43, 45], "vectorenv": 47, "vectori": 45, "vehicl": 16, "veloc": [17, 18, 24, 32, 34, 35, 36], "veri": [42, 43, 46], "version": [5, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 45], "via": [41, 47], "vitamin": [11, 12], "wa": [3, 4, 5, 6, 7, 8, 13, 14, 15, 41, 45], "wai": [3, 10], "walker2d": 36, "walker2denv": 35, "wall": 10, "want": 3, "warn": [16, 45], "water": [3, 11, 12, 16, 45], "we": [3, 42, 45, 46], "websit": [42, 45], "weight": [17, 18, 19, 22, 23, 34, 42, 43, 45, 48], "welfar": 41, "well": [42, 45, 46], "were": 10, "when": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 33, 37, 45, 46], "where": [6, 7, 8, 9, 11, 27, 28, 29, 30, 31, 45], "whether": [13, 14, 15, 38], "which": [4, 5, 6, 7, 8, 9, 10, 42, 45, 46, 47, 48], "while": [4, 10, 12, 16], "within": [45, 46, 47], "wood": [9, 12], "wood_amount": 12, "woodproba": 9, "work": [42, 47], "worker": 45, "workshop": [2, 41], "world": [6, 7, 8], "would": 3, "wrap": [45, 47], "wrapped_env": 47, "wrapper": [40, 42, 43, 45], "wrt": 38, "x": [6, 7, 8, 17, 18, 22, 23, 24, 33, 34, 35, 37], "x_po": 16, "x_veloc": [36, 45], "xu": 36, "y": [6, 7, 8, 17, 18, 37], "y_veloc": 36, "yang": [6, 7, 8, 11, 12, 16], "year": [2, 39, 42], "you": [3, 39, 42, 43, 44, 45, 46], "your": [1, 39, 42], "your_ag": [42, 43, 45], "z": [22, 23], "zero": [32, 45]}, "titles": ["404 - Page Not Found", "MO-Gymnasium documentation", "<no title>", "Community", "Breakable-Bottles", "Classic Control", "Deep-Sea-Treasure", "Deep-Sea-Treasure-Concave", "Deep-Sea-Treasure-Mirrored", "Fishwood", "Four-Room", "Fruit-Tree", "Grid-World", "Minecart", "Minecart-Deterministic", "Minecart-Rgb", "Miscellaneous", "MO-Ant", "MO-Ant-2D", "MO-Halfcheetah", "MO-Highway", "MO-Highway-Fast", "MO-Hopper", "MO-Hopper-2D", "MO-Humanoid", "MO-Lunar-Lander", "MO-Lunar-Lander-Continuous", "MO-Mountaincar", "MO-Mountaincar-3D", "MO-Mountaincar-Timemove", 
"MO-Mountaincar-Timespeed", "MO-Mountaincarcontinuous", "MO-Reacher", "MO-Supermario", "MO-Swimmer", "MO-Walker2D", "MuJoCo", "Resource-Gathering", "Water-Reservoir", "Citation", "MORL Baselines", "List of Publications", "API", "API", "Install", "Release Notes", "Creating a custom environment", "Vector Wrappers", "Wrappers"], "titleterms": {"0": 45, "1": [45, 46], "2": [45, 46], "29": 45, "2d": [18, 23], "3": [45, 46], "3d": 28, "4": [45, 46], "404": 0, "Not": 0, "The": 0, "acknowledg": 3, "action": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 32, 37, 38], "ant": [17, 18], "api": [42, 43], "argument": [4, 6, 7, 8, 9, 10, 13, 14, 15, 38], "baselin": 40, "becom": 45, "better": 45, "bottl": [4, 45], "breakabl": [4, 45], "bug": 45, "build": 1, "citat": 39, "cite": 42, "class": 46, "classic": 5, "commun": 3, "concav": 7, "continu": 26, "control": 5, "could": 0, "creat": 46, "credit": [4, 6, 7, 8, 9, 10, 13, 14, 15, 37, 38], "custom": 46, "deep": [6, 7, 8, 45], "descript": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 32, 33, 34, 35, 37, 38], "determinist": 14, "document": [1, 45], "environ": [45, 46], "episod": [4, 6, 7, 8, 10, 11, 13, 14, 15, 33, 37], "evalu": 45, "fast": 21, "fishwood": 9, "fix": 45, "found": 0, "four": 10, "front": 45, "fruit": [11, 45], "gather": 37, "grid": 12, "gymnasium": [1, 45], "halfcheetah": 19, "highwai": [20, 21], "hopper": [22, 23], "humanoid": 24, "improv": 45, "instal": [42, 44], "instanti": 46, "known": 45, "lander": [25, 26], "linearreward": 48, "list": 41, "lunar": [25, 26], "matur": 45, "migrat": 45, "minecart": [13, 14, 15], "mirror": [8, 45], "miscellan": 16, "mo": [1, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 45], "moclipreward": 48, "momaxandskipobserv": 48, "monormalizereward": 48, "more": 45, "morecordepisodestatist": [47, 48], "morl": 40, "mosyncvectorenv": 47, "mountaincar": [27, 28, 29, 30], "mountaincarcontinu": 31, "mujoco": [36, 45], "new": [45, 46], "note": 45, "observ": 
[4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 32, 37, 38], "page": [0, 45], "pareto": 45, "polici": 45, "public": 41, "pygam": 45, "reacher": [32, 45], "refer": 10, "regist": 46, "releas": 45, "render": 45, "request": 0, "reservoir": 38, "resourc": 37, "reward": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38], "rgb": 15, "room": 10, "sea": [6, 7, 8, 45], "space": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38], "start": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 37, 38], "state": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 37, 38], "supermario": 33, "support": 45, "swimmer": 34, "termin": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 33, 37], "test": 46, "timemov": 29, "timespe": 30, "treasur": [6, 7, 8, 45], "tree": [11, 45], "v0": 45, "v1": 45, "vector": 47, "walker2d": 35, "water": 38, "webpag": 45, "world": 12, "wrapper": [47, 48], "your": 46}}) \ No newline at end of file diff --git a/main/tutorials/custom_env/index.html b/main/tutorials/custom_env/index.html index 9a141d77..5e0ae121 100644 --- a/main/tutorials/custom_env/index.html +++ b/main/tutorials/custom_env/index.html @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -463,7 +465,7 @@

    4. Instantiate your environment + diff --git a/main/wrappers/vector_wrappers/index.html b/main/wrappers/vector_wrappers/index.html new file mode 100644 index 00000000..d0fee156 --- /dev/null +++ b/main/wrappers/vector_wrappers/index.html @@ -0,0 +1,713 @@ + + + + + + + + + + + + + + + Vector Wrappers - MO-Gymnasium Documentation + + + + + + + + + +
    + +
    + + + + + + + + Contents + + + + + + Menu + + + + + + + + Expand + + + + + + Light mode + + + + + + + + + + + + + + Dark mode + + + + + + + Auto light/dark mode + + + + + + + + + + + + + + + + + +
    + + +
    + + + + + +
    +
    +
    + + + + + Back to top + +
    + +
    + +
    +
    + +
    +

    Vector Wrappers

    +

    Similar to the normal wrappers, MO-Gymnasium provides a few wrappers that are specifically designed to work with vectorized environments. They are all available directly from the mo_gymnasium.wrappers.vector module.

    +
    +

    MOSyncVectorEnv

    +
    +
    +class mo_gymnasium.wrappers.vector.MOSyncVectorEnv(env_fns: Iterator[callable], copy: bool = True)
    +

    Vectorized environment that serially runs multiple environments.

    +

    Example

    +
    >>> import mo_gymnasium as mo_gym
    +
    +
    +
    >>> envs = mo_gym.wrappers.vector.MOSyncVectorEnv([
    +...     lambda: mo_gym.make("deep-sea-treasure-v0") for _ in range(4)
    +... ])
    +>>> envs
    +MOSyncVectorEnv(num_envs=4)
    +>>> obs, infos = envs.reset()
    +>>> obs
    +array([[0, 0], [0, 0], [0, 0], [0, 0]], dtype=int32)
    +>>> _ = envs.action_space.seed(42)
    +>>> actions = envs.action_space.sample()
    +>>> obs, rewards, terminateds, truncateds, infos = envs.step([0, 1, 2, 3])
    +>>> obs
    +array([[0, 0], [1, 0], [0, 0], [0, 3]], dtype=int32)
    +>>> rewards
    +array([[0., -1.], [0.7, -1.], [0., -1.], [0., -1.]], dtype=float32)
    +>>> terminateds
    +array([False,  True, False, False])
    +
    +
    +
    + +
    +
    +

    MORecordEpisodeStatistics

    +
    +
    +class mo_gymnasium.wrappers.vector.MORecordEpisodeStatistics(env: VectorEnv, gamma: float = 1.0, buffer_length: int = 100, stats_key: str = 'episode')
    +

    This wrapper will keep track of cumulative rewards and episode lengths.

    +

    At the end of any episode within the vectorized env, the statistics of the episode +will be added to info using the key episode, and the _episode key +is used to indicate the environment index which has a terminated or truncated episode.

    +
    +

    For vectorized environments, the output will be in the following form (be careful to first wrap the env into a vector env before applying MORecordEpisodeStatistics):

    +
    >>> infos = { 
    +...     "episode": {
    +...         "r": "<array of cumulative reward for each done sub-environment (2d array, shape (num_envs, dim_reward))>",
    +...         "dr": "<array of discounted reward for each done sub-environment (2d array, shape (num_envs, dim_reward))>",
    +...         "l": "<array of episode length for each done sub-environment (array)>",
    +...         "t": "<array of elapsed time since beginning of episode for each done sub-environment (array)>"
    +...     },
    +...     "_episode": "<boolean array of length num-envs>"
    +... }
    +
    +
    +
    +

    Moreover, the most recent rewards and episode lengths are stored in buffers that can be accessed via +wrapped_env.return_queue and wrapped_env.length_queue respectively.

    +
    +
    Variables:
    +
      +
    • return_queue – The cumulative rewards of the last buffer_length-many episodes

    • +
    • length_queue – The lengths of the last buffer_length-many episodes

    • +
    +
    +
    +
    + +
    +
    + +
    +
    + +
    + +
    +
    +
    + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/main/wrappers/wrappers/index.html b/main/wrappers/wrappers/index.html index 495cb95c..22a8655f 100644 --- a/main/wrappers/wrappers/index.html +++ b/main/wrappers/wrappers/index.html @@ -8,7 +8,7 @@ - + @@ -215,6 +215,7 @@
  • Install
  • API
  • Wrappers
  • +
  • Vector Wrappers
  • MORL Baselines
  • Environments

    @@ -252,6 +253,7 @@
  • MO-Halfcheetah
  • MO-Walker2D
  • MO-Ant
  • +
  • MO-Swimmer
  • MO-Humanoid
  • @@ -329,12 +331,12 @@

    Wrappers

    -

    A few wrappers inspired from Gymnasium’s wrappers are available in MO-Gymnasium. They are all available directly from the mo_gymnasium module.

    +

    A few wrappers inspired by Gymnasium’s wrappers are available in MO-Gymnasium. They are all available directly from the mo_gymnasium.wrappers module.

    LinearReward

    -
    -class mo_gymnasium.LinearReward(env: Env, weight: ndarray | None = None)
    +
    +class mo_gymnasium.wrappers.LinearReward(env: Env, weight: ndarray | None = None)

    Makes the env return a scalar reward, which is the dot-product between the reward vector and the weight vector.

    @@ -342,63 +344,59 @@

    LinearReward

    MONormalizeReward

    -
    -class mo_gymnasium.MONormalizeReward(env: Env, idx: int, gamma: float = 0.99, epsilon: float = 1e-08)
    +
    +class mo_gymnasium.wrappers.MONormalizeReward(env: Env, idx: int, gamma: float = 0.99, epsilon: float = 1e-08)

    Wrapper to normalize the reward component at index idx. Does not touch other reward components.

    +

    This code is heavily inspired by Gymnasium’s, except that it extracts the reward component at given idx, normalizes it, and reinjects it.

    +

    (!) This smooths the moving average of the reward, which can be useful for training stability. But it does not “normalize” the reward in the sense of making it have a mean of 0 and a standard deviation of 1.

    +

    Example

    +
    >>> import mo_gymnasium as mo_gym
    +>>> from mo_gymnasium.wrappers import MONormalizeReward
    +>>> env = mo_gym.make("deep-sea-treasure-v0")
    +>>> norm_treasure_env = MONormalizeReward(env, idx=0)
    +>>> both_norm_env = MONormalizeReward(norm_treasure_env, idx=1)
    +>>> both_norm_env.reset() # This one normalizes both rewards
    +
    +

    MOClipReward

    -
    -class mo_gymnasium.MOClipReward(env: Env, idx: int, min_r, max_r)
    +
    +class mo_gymnasium.wrappers.MOClipReward(env: Env, idx: int, min_r, max_r)

    Clip reward[idx] to [min, max].

    -
    -
    -

    MOSyncVectorEnv

    -
    -
    -class mo_gymnasium.MOSyncVectorEnv(env_fns: Iterator[callable], copy: bool = True)
    -

    Vectorized environment that serially runs multiple environments.

    -
    -

    MORecordEpisodeStatistics

    -
    -class mo_gymnasium.MORecordEpisodeStatistics(env: Env, gamma: float = 1.0, deque_size: int = 100)
    +
    +class mo_gymnasium.wrappers.MORecordEpisodeStatistics(env: Env, gamma: float = 1.0, buffer_length: int = 100, stats_key: str = 'episode')

    This wrapper will keep track of cumulative rewards and episode lengths.

    After the completion of an episode, info will look like this:

    >>> info = {
     ...     "episode": {
     ...         "r": "<cumulative reward (array)>",
     ...         "dr": "<discounted reward (array)>",
    -...         "l": "<episode length (scalar)>", # contrary to Gymnasium, these are not a numpy array
    +...         "l": "<episode length (scalar)>",
     ...         "t": "<elapsed time since beginning of episode (scalar)>"
     ...     },
     ... }
     
    -

    For a vectorized environments the output will be in the form of (be careful to first wrap the env into vector before applying MORewordStatistics):

    -
    >>> infos = {
    -...     "final_observation": "<array of length num-envs>",
    -...     "_final_observation": "<boolean array of length num-envs>",
    -...     "final_info": "<array of length num-envs>",
    -...     "_final_info": "<boolean array of length num-envs>",
    -...     "episode": {
    -...         "r": "<array of cumulative reward (2d array, shape (num_envs, dim_reward))>",
    -...         "dr": "<array of discounted reward (2d array, shape (num_envs, dim_reward))>",
    -...         "l": "<array of episode length (array)>",
    -...         "t": "<array of elapsed time since beginning of episode (array)>"
    -...     },
    -...     "_episode": "<boolean array of length num-envs>"
    -... }
    -
    -
    +
    + +
    +
    +

    MOMaxAndSkipObservation

    +
    +
    +class mo_gymnasium.wrappers.MOMaxAndSkipObservation(env: Env[ObsType, ActType], skip: int = 4)
    +

    This wrapper will return only every skip-th frame (frameskipping) and return the max between the two last observations.

    +

    Note: This wrapper is based on the wrapper from stable-baselines3: https://stable-baselines3.readthedocs.io/en/master/_modules/stable_baselines3/common/atari_wrappers.html#MaxAndSkipEnv

    @@ -409,12 +407,12 @@

    MORecordEpisode