From 274b7439c08ffd26a9fdda25c3a538bff99e0138 Mon Sep 17 00:00:00 2001 From: LucasAlegre Date: Mon, 28 Oct 2024 15:33:45 +0000 Subject: [PATCH] =?UTF-8?q?Deploying=20to=20gh-pages=20from=20@=20Farama-F?= =?UTF-8?q?oundation/MO-Gymnasium@3b1b030b9743f217fab614d16903d139eceaab52?= =?UTF-8?q?=20=F0=9F=9A=80?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- .buildinfo | 2 +- 404.html | 3 +- README/index.html | 3 +- _static/documentation_options.js | 2 +- citing/citing/index.html | 3 +- community/community/index.html | 3 +- environments/breakable-bottles/index.html | 3 +- environments/classical/index.html | 3 +- .../deep-sea-treasure-concave/index.html | 3 +- .../deep-sea-treasure-mirrored/index.html | 3 +- environments/deep-sea-treasure/index.html | 3 +- environments/fishwood/index.html | 3 +- environments/four-room/index.html | 3 +- environments/fruit-tree/index.html | 3 +- environments/grid-world/index.html | 3 +- .../minecart-deterministic/index.html | 3 +- environments/minecart-rgb/index.html | 3 +- environments/minecart/index.html | 3 +- environments/misc/index.html | 3 +- environments/mo-ant-2d/index.html | 3 +- environments/mo-ant-2obj/index.html | 677 ++++++++++++++++++ environments/mo-ant/index.html | 36 +- environments/mo-halfcheetah/index.html | 19 +- environments/mo-highway-fast/index.html | 3 +- environments/mo-highway/index.html | 3 +- environments/mo-hopper-2d/index.html | 3 +- environments/mo-hopper-2obj/index.html | 675 +++++++++++++++++ environments/mo-hopper/index.html | 35 +- environments/mo-humanoid/index.html | 18 +- .../mo-lunar-lander-continuous/index.html | 3 +- environments/mo-lunar-lander/index.html | 3 +- environments/mo-mountaincar-3d/index.html | 3 +- .../mo-mountaincar-timemove/index.html | 3 +- .../mo-mountaincar-timespeed/index.html | 3 +- environments/mo-mountaincar/index.html | 3 +- .../mo-mountaincarcontinuous/index.html | 3 +- environments/mo-reacher/index.html | 26 +- 
environments/mo-supermario/index.html | 3 +- environments/mo-swimmer/index.html | 28 +- environments/mo-walker2d/index.html | 15 +- environments/mujoco/index.html | 3 +- environments/resource-gathering/index.html | 3 +- environments/water-reservoir/index.html | 3 +- examples/citation/index.html | 3 +- examples/morl_baselines/index.html | 3 +- examples/publications/index.html | 3 +- genindex/index.html | 3 +- index.html | 3 +- introduction/api/index.html | 3 +- introduction/install/index.html | 3 +- objects.inv | Bin 1521 -> 1559 bytes release_notes/index.html | 27 +- search/index.html | 3 +- searchindex.js | 2 +- tutorials/custom_env/index.html | 3 +- wrappers/vector_wrappers/index.html | 3 +- wrappers/wrappers/index.html | 3 +- 57 files changed, 1607 insertions(+), 84 deletions(-) create mode 100644 environments/mo-ant-2obj/index.html create mode 100644 environments/mo-hopper-2obj/index.html diff --git a/.buildinfo b/.buildinfo index 055f7d2..fb2539f 100644 --- a/.buildinfo +++ b/.buildinfo @@ -1,4 +1,4 @@ # Sphinx build info version 1 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done. -config: 9e28e034788f88155ad752a56985e689 +config: 029408ec80ac705c56ad18ad01221a7f tags: d77d1c0d9ca2f4c8421862c7c5a0d620 diff --git a/404.html b/404.html index a34feb5..92acacc 100644 --- a/404.html +++ b/404.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -419,7 +420,7 @@

    The requested page could not be found. + diff --git a/README/index.html b/README/index.html index 7fb6c10..4ddc209 100644 --- a/README/index.html +++ b/README/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -436,7 +437,7 @@

    Build the Documentation + diff --git a/_static/documentation_options.js b/_static/documentation_options.js index 5981673..dc28e0c 100644 --- a/_static/documentation_options.js +++ b/_static/documentation_options.js @@ -1,5 +1,5 @@ const DOCUMENTATION_OPTIONS = { - VERSION: '1.2.0', + VERSION: '1.3.0', LANGUAGE: 'en', COLLAPSE_INDEX: false, BUILDER: 'dirhtml', diff --git a/citing/citing/index.html b/citing/citing/index.html index 587905c..a1789a3 100644 --- a/citing/citing/index.html +++ b/citing/citing/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -405,7 +406,7 @@ - + diff --git a/community/community/index.html b/community/community/index.html index c1a5ea8..12b32b2 100644 --- a/community/community/index.html +++ b/community/community/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -450,7 +451,7 @@

    Acknowledgements + diff --git a/environments/breakable-bottles/index.html b/environments/breakable-bottles/index.html index d65bffb..06cb051 100644 --- a/environments/breakable-bottles/index.html +++ b/environments/breakable-bottles/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -519,7 +520,7 @@

    Credits¶ - + diff --git a/environments/classical/index.html b/environments/classical/index.html index 0cf2ce8..76762eb 100644 --- a/environments/classical/index.html +++ b/environments/classical/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -468,7 +469,7 @@

    Classic Control + diff --git a/environments/deep-sea-treasure-concave/index.html b/environments/deep-sea-treasure-concave/index.html index b9dc38b..1cb2fd0 100644 --- a/environments/deep-sea-treasure-concave/index.html +++ b/environments/deep-sea-treasure-concave/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -522,7 +523,7 @@

    Credits¶ - + diff --git a/environments/deep-sea-treasure-mirrored/index.html b/environments/deep-sea-treasure-mirrored/index.html index 4ff35b4..0e7f548 100644 --- a/environments/deep-sea-treasure-mirrored/index.html +++ b/environments/deep-sea-treasure-mirrored/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -512,7 +513,7 @@

    Credits¶ - + diff --git a/environments/deep-sea-treasure/index.html b/environments/deep-sea-treasure/index.html index 37335e5..1c66104 100644 --- a/environments/deep-sea-treasure/index.html +++ b/environments/deep-sea-treasure/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -510,7 +511,7 @@

    Credits¶ - + diff --git a/environments/fishwood/index.html b/environments/fishwood/index.html index 389cffc..a9b6b35 100644 --- a/environments/fishwood/index.html +++ b/environments/fishwood/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -507,7 +508,7 @@

    Credits¶ - + diff --git a/environments/four-room/index.html b/environments/four-room/index.html index 19e8738..86cd45a 100644 --- a/environments/four-room/index.html +++ b/environments/four-room/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -509,7 +510,7 @@

    Credits¶ - + diff --git a/environments/fruit-tree/index.html b/environments/fruit-tree/index.html index 413e636..7680a77 100644 --- a/environments/fruit-tree/index.html +++ b/environments/fruit-tree/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -486,7 +487,7 @@

    Episode Termination + diff --git a/environments/grid-world/index.html b/environments/grid-world/index.html index 4a1e46d..a0f3918 100644 --- a/environments/grid-world/index.html +++ b/environments/grid-world/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -475,7 +476,7 @@

    Grid-World + diff --git a/environments/minecart-deterministic/index.html b/environments/minecart-deterministic/index.html index 4b86558..c6555ae 100644 --- a/environments/minecart-deterministic/index.html +++ b/environments/minecart-deterministic/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -534,7 +535,7 @@

    Credits¶ - + diff --git a/environments/minecart-rgb/index.html b/environments/minecart-rgb/index.html index 31fc55a..285bca3 100644 --- a/environments/minecart-rgb/index.html +++ b/environments/minecart-rgb/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -524,7 +525,7 @@

    Credits¶ - + diff --git a/environments/minecart/index.html b/environments/minecart/index.html index 96e1627..f5e5c6a 100644 --- a/environments/minecart/index.html +++ b/environments/minecart/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -522,7 +523,7 @@

    Credits¶ - + diff --git a/environments/misc/index.html b/environments/misc/index.html index 0663678..0421b6f 100644 --- a/environments/misc/index.html +++ b/environments/misc/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -455,7 +456,7 @@

    Miscellaneous + diff --git a/environments/mo-ant-2d/index.html b/environments/mo-ant-2d/index.html index 6211659..ba0c002 100644 --- a/environments/mo-ant-2d/index.html +++ b/environments/mo-ant-2d/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -466,7 +467,7 @@

    Reward Space + diff --git a/environments/mo-ant-2obj/index.html b/environments/mo-ant-2obj/index.html new file mode 100644 index 0000000..f929f54 --- /dev/null +++ b/environments/mo-ant-2obj/index.html @@ -0,0 +1,677 @@ + + + + + + + + + + + + + + + MO-Ant-2Obj - MO-Gymnasium Documentation + + + + + + + + + +
    + +
    + + + + + + + + Contents + + + + + + Menu + + + + + + + + Expand + + + + + + Light mode + + + + + + + + + + + + + + Dark mode + + + + + + + Auto light/dark mode + + + + + + + + + + + + + + + + + +
    + + +
    + + + + + +
    +
    +
    + + + + + Back to top + +
    + +
    + +
    +
    + +
    +

    MO-Ant-2Obj

    +
    +_static/videos/mo-ant-2obj.gif + +
    +
    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +

    Action Space

    Box(-1.0, 1.0, (8,), float32)

    Observation Shape

    (105,)

    Observation High

    inf

    Observation Low

    -inf

    Reward Shape

    (2,)

    Reward High

    [inf inf]

    Reward Low

    [-inf -inf]

    Import

    mo_gymnasium.make("mo-ant-2obj-v5")

    +
    +
    +

    Description

    +

    Multi-objective version of the AntEnv environment.

    +

    See Gymnasium’s env for more information.

    +

    The original Gymnasium’s ‘Ant-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-ant-v5’, cost_objective=False) +LinearReward(env, weight=np.array([1.0, 0.0]))

    +
    +
    +

    Reward Space

    +

    The reward is 2- or 3-dimensional:

    +
      +
    • 0: x-velocity

    • +
    • 1: y-velocity

    • +
    • 2: Control cost of the action +If the cost_objective flag is set to False, the reward is 2-dimensional, and the cost is added to other objectives. +A healthy reward and a cost for contact forces are added to all objectives.

    • +
    +

    A 2-objective version (without the cost objective as a separate objective) can be instantiated via: +env = mo_gym.make(‘mo-ant-2obj-v5’)

    +
    +
    +

    Version History

    +
      +
    • v5: Now includes contact forces in the reward and observation. +The 2-objective version now has the id ‘mo-ant-2obj-v5’ instead of ‘mo-ant-2d-v4’. +See https://gymnasium.farama.org/environments/mujoco/ant/#version-history

    • +
    +
    +
    + +
    +
    +
    + + +
    +
    + + +
    +
    + +
    +
    + +
    +
    + +
    +
    +
    + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/environments/mo-ant/index.html b/environments/mo-ant/index.html index ad0566e..03d56f3 100644 --- a/environments/mo-ant/index.html +++ b/environments/mo-ant/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -338,7 +339,7 @@

    MO-Ant

    Box(-1.0, 1.0, (8,), float32)

    Observation Shape

    -

    (27,)

    +

    (105,)

    Observation High

    inf

    @@ -356,7 +357,7 @@

    MO-Ant

    [-inf -inf -inf]

    Import

    -

    mo_gymnasium.make("mo-ant-v4")

    +

    mo_gymnasium.make("mo-ant-v5")

    @@ -365,7 +366,7 @@

    MO-AntDescription

    Multi-objective version of the AntEnv environment.

    See Gymnasium’s env for more information.

    -

    The original Gymnasium’s ‘Ant-v4’ is recovered by the following linear scalarization:

    +

    The original Gymnasium’s ‘Ant-v5’ is recovered by the following linear scalarization:

    env = mo_gym.make(‘mo-ant-v4’, cost_objective=False) LinearReward(env, weight=np.array([1.0, 0.0]))

    @@ -377,7 +378,17 @@

    Reward Space +

    Version History

    +
      +
    • v5: Now includes contact forces in the reward and observation. +The 2-objective version now has the id ‘mo-ant-2obj-v5’ instead of ‘mo-ant-2d-v4’. +See https://gymnasium.farama.org/environments/mujoco/ant/#version-history

    @@ -398,7 +409,19 @@

    Reward Space - + + + + +
    +
    + Previous +
    + +
    MO-Walker2D
    + +
    +
    @@ -442,6 +465,7 @@

    Reward SpaceMO-Ant @@ -476,7 +500,7 @@

    Reward Space + diff --git a/environments/mo-halfcheetah/index.html b/environments/mo-halfcheetah/index.html index db2807c..bd89879 100644 --- a/environments/mo-halfcheetah/index.html +++ b/environments/mo-halfcheetah/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -356,7 +357,7 @@

    MO-Halfcheetah

    Import

    -

    mo_gymnasium.make("mo-halfcheetah-v4")

    +

    mo_gymnasium.make("mo-halfcheetah-v5")

    @@ -365,9 +366,9 @@

    MO-Halfcheetah

    Multi-objective version of the HalfCheetahEnv environment.

    See Gymnasium’s env for more information.

    -

    The original Gymnasium’s ‘HalfCheetah-v4’ is recovered by the following linear scalarization:

    -

    env = mo_gym.make(‘mo-halfcheetah-v4’) -LinearReward(env, weight=np.array([1.0, 1.0]))

    +

    The original Gymnasium’s ‘HalfCheetah-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-halfcheetah-v5’) +LinearReward(env, weight=np.array([1.0, 0.1]))

    Reward Space

    @@ -377,6 +378,13 @@

    Reward Space +

    Version History

    +
      +
    • v5: The scale of the control cost has changed from v4. +See https://gymnasium.farama.org/environments/mujoco/half_cheetah/#version-history for other changes.

    • +
    +

    @@ -441,6 +449,7 @@

    Reward SpaceMO-Halfcheetah @@ -475,7 +484,7 @@

    Reward Space + diff --git a/environments/mo-highway-fast/index.html b/environments/mo-highway-fast/index.html index b1e48a0..4d02af1 100644 --- a/environments/mo-highway-fast/index.html +++ b/environments/mo-highway-fast/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -428,7 +429,7 @@

    MO-Highway-Fast + diff --git a/environments/mo-highway/index.html b/environments/mo-highway/index.html index 19c60fd..22d8530 100644 --- a/environments/mo-highway/index.html +++ b/environments/mo-highway/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -471,7 +472,7 @@

    Reward Space + diff --git a/environments/mo-hopper-2d/index.html b/environments/mo-hopper-2d/index.html index 3377ff9..d8e8ae7 100644 --- a/environments/mo-hopper-2d/index.html +++ b/environments/mo-hopper-2d/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -465,7 +466,7 @@

    Reward Space + diff --git a/environments/mo-hopper-2obj/index.html b/environments/mo-hopper-2obj/index.html new file mode 100644 index 0000000..0d324df --- /dev/null +++ b/environments/mo-hopper-2obj/index.html @@ -0,0 +1,675 @@ + + + + + + + + + + + + + + + MO-Hopper-2Obj - MO-Gymnasium Documentation + + + + + + + + + +
    + +
    + + + + + + + + Contents + + + + + + Menu + + + + + + + + Expand + + + + + + Light mode + + + + + + + + + + + + + + Dark mode + + + + + + + Auto light/dark mode + + + + + + + + + + + + + + + + + +
    + + +
    + + + + + +
    +
    +
    + + + + + Back to top + +
    + +
    + +
    +
    + +
    +

    MO-Hopper-2Obj

    +
    +_static/videos/mo-hopper-2obj.gif + +
    +
    + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + +

    Action Space

    Box(-1.0, 1.0, (3,), float32)

    Observation Shape

    (11,)

    Observation High

    inf

    Observation Low

    -inf

    Reward Shape

    (2,)

    Reward High

    [inf inf]

    Reward Low

    [-inf -inf]

    Import

    mo_gymnasium.make("mo-hopper-2obj-v5")

    +
    +
    +

    Description

    +

    Multi-objective version of the HopperEnv environment.

    +

    See Gymnasium’s env for more information.

    +

    The original Gymnasium’s ‘Hopper-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-hopper-v5’) +LinearReward(env, weight=np.array([1.0, 0.0, 1e-3]))

    +
    +
    +

    Reward Space

    +

    The reward is 3-dimensional:

    +
      +
    • 0: Reward for going forward on the x-axis

    • +
    • 1: Reward for jumping high on the z-axis

    • +
    • 2: Control cost of the action +If the cost_objective flag is set to False, the reward is 2-dimensional, and the cost is added to other objectives.

    • +
    +

    A 2-objective version (without the cost objective as a separate objective) can be instantiated via: +env = mo_gym.make(‘mo-hopper-2obj-v5’)

    +
    +
    +

    Version History

    +
      +
    • v5: The 2-objective version now has the id ‘mo-hopper-2obj-v5’ instead of ‘mo-hopper-2d-v4’. +See https://gymnasium.farama.org/environments/mujoco/hopper/#version-history

    • +
    +
    +
    + +
    +
    +
    + + +
    +
    + + +
    +
    + +
    +
    + +
    +
    + +
    +
    +
    + + + + + + + + + + + + + + + + + \ No newline at end of file diff --git a/environments/mo-hopper/index.html b/environments/mo-hopper/index.html index 1fb3f2d..5c5b75c 100644 --- a/environments/mo-hopper/index.html +++ b/environments/mo-hopper/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -356,7 +357,7 @@

    MO-Hopper

    Import

    -

    mo_gymnasium.make("mo-hopper-v4")

    +

    mo_gymnasium.make("mo-hopper-v5")

    @@ -365,9 +366,9 @@

    MO-Hopper

    Multi-objective version of the HopperEnv environment.

    See Gymnasium’s env for more information.

    -

    The original Gymnasium’s ‘Hopper-v4’ is recovered by the following linear scalarization:

    -

    env = mo_gym.make(‘mo-hopper-v4’, cost_objective=False) -LinearReward(env, weight=np.array([1.0, 0.0]))

    +

    The original Gymnasium’s ‘Hopper-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-hopper-v5’) +LinearReward(env, weight=np.array([1.0, 0.0, 1e-3]))

    Reward Space

    @@ -378,6 +379,15 @@

    Reward Space +

    Version History

    +
      +
    • v5: The 2-objective version now has the id ‘mo-hopper-2obj-v5’ instead of ‘mo-hopper-2d-v4’. +See https://gymnasium.farama.org/environments/mujoco/hopper/#version-history

    • +

    @@ -397,7 +407,19 @@

    Reward Space - + + + + +
    +
    + Previous +
    + +
    MO-Reacher
    + +
    +

    @@ -441,6 +463,7 @@

    Reward SpaceMO-Hopper @@ -475,7 +498,7 @@

    Reward Space + diff --git a/environments/mo-humanoid/index.html b/environments/mo-humanoid/index.html index a73342a..2944daa 100644 --- a/environments/mo-humanoid/index.html +++ b/environments/mo-humanoid/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -338,7 +339,7 @@

    MO-Humanoid

    Observation Shape

    -

    (376,)

    +

    (348,)

    Observation High

    inf

    @@ -356,7 +357,7 @@

    MO-Humanoid

    Import

    -

    mo_gymnasium.make("mo-humanoid-v4")

    +

    mo_gymnasium.make("mo-humanoid-v5")

    @@ -365,6 +366,9 @@

    MO-Humanoid

    Multi-objective version of the HumanoidEnv environment.

    See Gymnasium’s env for more information.

    +

    The original Gymnasium’s ‘Humanoid-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-humanoid-v5’) +LinearReward(env, weight=np.array([1.25, 0.1]))

    Reward Space

    @@ -374,6 +378,13 @@

    Reward Space +

    Version History:

    +
      +
    • v5: Now includes contact forces. See: https://gymnasium.farama.org/environments/mujoco/humanoid/#version-history +The scale of the control cost has changed from v4.

    • +
    +

    @@ -438,6 +449,7 @@

    Reward SpaceMO-Humanoid @@ -472,7 +484,7 @@

    Reward Space + diff --git a/environments/mo-lunar-lander-continuous/index.html b/environments/mo-lunar-lander-continuous/index.html index eb96dae..710f1f4 100644 --- a/environments/mo-lunar-lander-continuous/index.html +++ b/environments/mo-lunar-lander-continuous/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -474,7 +475,7 @@

    Reward Space + diff --git a/environments/mo-lunar-lander/index.html b/environments/mo-lunar-lander/index.html index dd0b7dd..308e0a5 100644 --- a/environments/mo-lunar-lander/index.html +++ b/environments/mo-lunar-lander/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -472,7 +473,7 @@

    Reward Space + diff --git a/environments/mo-mountaincar-3d/index.html b/environments/mo-mountaincar-3d/index.html index 35045fa..f8cec88 100644 --- a/environments/mo-mountaincar-3d/index.html +++ b/environments/mo-mountaincar-3d/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -463,7 +464,7 @@

    Reward space: + diff --git a/environments/mo-mountaincar-timemove/index.html b/environments/mo-mountaincar-timemove/index.html index 8e9b9c9..791f86f 100644 --- a/environments/mo-mountaincar-timemove/index.html +++ b/environments/mo-mountaincar-timemove/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -463,7 +464,7 @@

    Reward space: + diff --git a/environments/mo-mountaincar-timespeed/index.html b/environments/mo-mountaincar-timespeed/index.html index cb08889..ff92d62 100644 --- a/environments/mo-mountaincar-timespeed/index.html +++ b/environments/mo-mountaincar-timespeed/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -463,7 +464,7 @@

    Reward space: + diff --git a/environments/mo-mountaincar/index.html b/environments/mo-mountaincar/index.html index 21fefc4..f19bb1c 100644 --- a/environments/mo-mountaincar/index.html +++ b/environments/mo-mountaincar/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -473,7 +474,7 @@

    Reward space: + diff --git a/environments/mo-mountaincarcontinuous/index.html b/environments/mo-mountaincarcontinuous/index.html index 0132d20..84cf0d7 100644 --- a/environments/mo-mountaincarcontinuous/index.html +++ b/environments/mo-mountaincarcontinuous/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -466,7 +467,7 @@

    Reward space: + diff --git a/environments/mo-reacher/index.html b/environments/mo-reacher/index.html index de4bd00..537aad4 100644 --- a/environments/mo-reacher/index.html +++ b/environments/mo-reacher/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -356,7 +357,7 @@

    MO-Reacher

    Import

    -

    mo_gymnasium.make("mo-reacher-v4")

    +

    mo_gymnasium.make("mo-reacher-v5")

    @@ -385,6 +386,10 @@

    Reward Space +

    Version History:

    +

    See https://gymnasium.farama.org/environments/mujoco/reacher/#version-history

    + @@ -392,18 +397,20 @@

    Reward Space - + + + + +
    - Next + Previous
    -
    MO-Hopper
    + +
    MuJoCo
    +
    - - -
    -

    @@ -449,6 +456,7 @@

    Reward SpaceObservation Space
  • Action Space
  • Reward Space
  • +
  • Version History:
  • @@ -483,7 +491,7 @@

    Reward Space + diff --git a/environments/mo-supermario/index.html b/environments/mo-supermario/index.html index ea4a18a..7371202 100644 --- a/environments/mo-supermario/index.html +++ b/environments/mo-supermario/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -478,7 +479,7 @@

    Episode Termination + diff --git a/environments/mo-swimmer/index.html b/environments/mo-swimmer/index.html index 4880977..f9c36eb 100644 --- a/environments/mo-swimmer/index.html +++ b/environments/mo-swimmer/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -356,7 +357,7 @@

    MO-Swimmer

    Import

    -

    mo_gymnasium.make("mo-swimmer-v4")

    +

    mo_gymnasium.make("mo-swimmer-v5")

    @@ -365,8 +366,8 @@

    MO-Swimmer

    Multi-objective version of the SwimmerEnv environment.

    See Gymnasium’s env for more information.

    -

    The original Gymnasium’s ‘Swimmer-v4’ is recovered by the following linear scalarization:

    -

    env = mo_gym.make(‘mo-swimmer-v4’) +

    The original Gymnasium’s ‘Swimmer-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-swimmer-v5’) LinearReward(env, weight=np.array([1.0, 1e-4]))

    @@ -377,6 +378,10 @@

    Reward Space +

    Version History:

    +

    See https://gymnasium.farama.org/main/environments/mujoco/swimmer/#version-history

    +

    @@ -395,7 +400,19 @@

    Reward Space - + + + + +
    +
    + Previous +
    + +
    MO-Ant
    + +
    +

    @@ -439,6 +456,7 @@

    Reward SpaceMO-Swimmer @@ -473,7 +491,7 @@

    Reward Space + diff --git a/environments/mo-walker2d/index.html b/environments/mo-walker2d/index.html index 8c390df..9d98aca 100644 --- a/environments/mo-walker2d/index.html +++ b/environments/mo-walker2d/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -356,7 +357,7 @@

    MO-Walker2D

    Import

    -

    mo_gymnasium.make("mo-walker2d-v4")

    +

    mo_gymnasium.make("mo-walker2d-v5")

    @@ -365,6 +366,9 @@

    MO-Walker2D

    Multi-objective version of the Walker2dEnv environment.

    See Gymnasium’s env for more information.

    +

    The original Gymnasium’s ‘Walker2d-v5’ is recovered by the following linear scalarization:

    +

    env = mo_gym.make(‘mo-walker2d-v5’) +LinearReward(env, weight=np.array([1.0, 1e-3]))

    Reward Space

    @@ -374,6 +378,12 @@

    Reward Space +

    Version History

    +
      +
    • See https://gymnasium.farama.org/main/environments/mujoco/walker2d/#version-history

    • +

    @@ -440,6 +450,7 @@

    Reward SpaceReward Space +
  • Version History
  • @@ -472,7 +483,7 @@

    Reward Space + diff --git a/environments/mujoco/index.html b/environments/mujoco/index.html index 40c4e4a..c795081 100644 --- a/environments/mujoco/index.html +++ b/environments/mujoco/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -470,7 +471,7 @@

    MuJoCo + diff --git a/environments/resource-gathering/index.html b/environments/resource-gathering/index.html index 1128964..bd862cf 100644 --- a/environments/resource-gathering/index.html +++ b/environments/resource-gathering/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -509,7 +510,7 @@

    Credits¶ - + diff --git a/environments/water-reservoir/index.html b/environments/water-reservoir/index.html index 1168e99..de9fac5 100644 --- a/environments/water-reservoir/index.html +++ b/environments/water-reservoir/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -513,7 +514,7 @@

    Credits¶ - + diff --git a/examples/citation/index.html b/examples/citation/index.html index 89d6c0c..4a9118f 100644 --- a/examples/citation/index.html +++ b/examples/citation/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -416,7 +417,7 @@

    Citation - + diff --git a/examples/morl_baselines/index.html b/examples/morl_baselines/index.html index f52abf0..ef3ddc1 100644 --- a/examples/morl_baselines/index.html +++ b/examples/morl_baselines/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -420,7 +421,7 @@

    MORL Baselines + diff --git a/examples/publications/index.html b/examples/publications/index.html index 0430579..5b6ffb0 100644 --- a/examples/publications/index.html +++ b/examples/publications/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -424,7 +425,7 @@

    List of Publications + diff --git a/genindex/index.html b/genindex/index.html index 2a922f0..a82e40f 100644 --- a/genindex/index.html +++ b/genindex/index.html @@ -250,6 +250,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -422,7 +423,7 @@

    M

    - + diff --git a/index.html b/index.html index 6b7864c..1a674fe 100644 --- a/index.html +++ b/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -459,7 +460,7 @@

    Citing + diff --git a/introduction/api/index.html b/introduction/api/index.html index 91ab426..a31b0d6 100644 --- a/introduction/api/index.html +++ b/introduction/api/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -425,7 +426,7 @@

    API

    + diff --git a/introduction/install/index.html b/introduction/install/index.html index d09f6d3..841d5fc 100644 --- a/introduction/install/index.html +++ b/introduction/install/index.html @@ -252,6 +252,7 @@
  • MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -412,7 +413,7 @@

    Install¶ - + diff --git a/objects.inv b/objects.inv index 3ba6d0782e0893d074bd6c05b4e7acc7a196291f..809de9751498e53c2edbb3d21cf0e2f0380b7141 100644 GIT binary patch delta 1452 zcmV;d1ylO*3zrO#eSdG5D7d z(1MHda?d0$>79bYq+*5qW#Tg}6c;CgJJG{Q{JUdQ{9`UIo9F+Dddj-sRHk2CoAu>I zX8)3+rpQ<+3%3^zeq8G18+0*W_)a_}--NIt-@;9MTIw)tMHSIo{j~f(W<}fUT7v<=K2r9=$7m#`pOmh#M`FKHkW4?*OzW=*OQ~`8~oWOMKIRZ zv{7b_v#p@y2iaB>Z@E$xl}2BYEv+bUl7D0?Xrk&_tgU)BfD7IfToh=2|0ny@jA61>XNlZq1O zJA^KD*Bx|y>$|db+ps>zuyONT_`Dm+R&LS>Nr!z6WWDakrfDCUd^&I*Phtad^r>%o z0Nx5LIDfC>1RIg-CyBrtXnG9MGNoq`U*ItWD5eb)^OkTYScwl@RPou2AvyZ2+xNOX z#nf;#7DT8h#0J2VuWy9`xTJ~-xH1phMcg!egyRdhKaxu9w#x}1$iZ%QTOTGp7C`o(|-g#C0JZs%ytE_>oApf@R`dApQg$b1K(HA;~il9mzB! zjD<}cf*ew4D{b7uZaQHTU~o^{nlzlH%j;u0Sbs4iRc%8AhMS;FubCTXh*zfL%5)^D z`hWBQPt(Fpwl;wyndQN;IkAJUP!_J0g>Ak_~l(vKt?V?g)ah5xy0zw;t7GcyeO z_HTaf%|%cNo~NLAM-(ia_X4vJnxl>F`)vEB_yYlJ06V1LYB`Iqmlv0#d(*M89U1*e z>b-XG@G{lC9=j-i5WIQc8ih4DsfR6*v;u=6gYs#JUhvHo`e?65)V|$T@Cu;$VSkVt zkfSRwMuzQz#q%!3f4$Psw%4L$8`;+kxkrfc!Gn!?WdRUvuS|mXnmaZtP2qB zTCH^Sm=RIuGAH5IlB5*ck$56&J%7?N?L0=I?;E39*Eu?J$0Nq2y-S?QMo+k;?OdS) z80}wN+8ID!w79sVu3SgSa2^iHdZoqGx**Dik8AB{-Y|3o3y0gW=x?|(#(oRNg&_Nbn~BTSTnRus&wwyH>SVO&Qzj@MI@`s_Xk1tdn)AnTUJpbR`ftbj`qhdSwW;k zACL)1`@*~55Kc-jzI_Dqlad{r8Qe;)N*2tA97}zHw2Kg8fV1+_M$U zxX7>eO!Azr6?9B0mdRfxzR*l@aU!@CJ)Xp0AFJ%AzPPGh{wL}w^MYfUesOM=cP}vd zw{&WZ40UDZ@xtEQrJR32XY=`=#8dK(2n+JfJhZ2!_QMwRBKWAEmfyuJ$b8ZxFyDjl zP5=4#&q%8LOMlL@h6$Hx^9NycPqq|&;|g8#y2_K))!F6Ul^xsGr0DKDzA;G=wACf8 zl%C^cBPe+$n}XsESE`^=>kG1>MMI#~3lqF*;$=FCP2aKn19UNCidEaR{bzSz)R3Y- zDvlHb<)2B$%d)PRI;MSTB%C&<=)x3}oYFm(lwbv2l7F?JkzP+?O|K^nIOA1DUQU7; zO&D4-A-JIVNmL^;*!ViwGdHth=)A8wZ>z>^eebf26hUSm0SnR=VPPsIc#*^h6(mkq z2wgT+YpD9sRVB-oVR?>z;ikFpMcb4tT%;3{_Ur1&de^m$(>^h|J8&LOVggch-IW{w zuLTyImw#b`iAbBBMBo(^9fqixYDN*B;2{Jkx(owzrf@4*jt^WE;n55sDY|LO4^4TD zDdA|$h)_X@34ooiEBOI9r-}-=(wprpZX7d`1ls27iD*UQQT0QaoilN)_3~KvtNh{WV-q zk!-s=kYg0rhP0@*9KzryBGm$xj z&gx=XRCh5U6?H`fhWjj!573U 
Li)t1F_^W`hRXP{Vz^G=U|V;YbQMO_wEqUbN3&cH-Ce^{+nMoV-Zw>t;i_e5(N|Iyd%tnrf6mA zZcN=6e;{!B!U{Dnj+}+(%ZW?TgRWSaiiEzBa^IL_cwcGXKy8%U2==!t4Z;%4%HxJe zTEH1Dz4CELGvTXSbZ)K()V|&n;IbROA7lrl=oY*O;!o(_s!hh$&;RZ*n7{5-!+-I5 z0oCC4I@y+14EEXAvB=b>=xg&Y8A7_@ptJk0Pz$dQd7bHLC3|KExNYfF!78apQ3O?8 zd(#J9NJa+IKfvBXcEgKU#yG$+jV{jE!Wl?o42^WKaRE_ly;L1=yH@;^Hp>aNb$jIO-YnVq)uJyvU`K@AoMK()J-i zh;br=%<&yTrR6*>Uvwz3va2;?5=MO-Hopper
  • MO-Halfcheetah
  • MO-Walker2D
  • +
  • Version History
  • MO-Ant
  • MO-Swimmer
  • MO-Humanoid
  • @@ -331,6 +332,27 @@

    Release Notes

    +
    +

    v1.3.0: MO-Gymnasium 1.3.0 Release: New Mujoco v5 Environments

    +

    Released on 2024-10-28 - GitHub - PyPI

    +

    This release adds the new Mujoco v5 environments:

    +
      +
    • mo-ant-v5
    • +
    • mo-ant-2obj-v5
    • +
    • mo-hopper-v5
    • +
    • mo-hopper-2obj-v5
    • +
    • mo-walker2d-v5
    • +
    • mo-halfcheetah-v5
    • +
    • mo-humanoid-v5
    • +
    • mo-swimmer-v5
    • +
    +

    What's Changed

    + +

    Full Changelog: v1.2.0...v1.3.0

    v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more

    Released on 2024-10-16 - GitHub - PyPI

    @@ -440,7 +462,7 @@

    MO-Gymnasium 1.0.0 Release Notes

    reward = forward_reward - ctrl_cost

    With MORL, users have the flexibility to determine the compromises they desire based on their preferences for each objective. Consequently, the environments in MO-Gymnasium do not have predefined weights. Thus, MO-Gymnasium extends the capabilities of Gymnasium to the multi-objective setting, where the agents receives a vectorial reward.

    For example, here is an illustration of the multiple policies learned by an MORL agent for the mo-halfcheetah domain, balancing between saving battery and speed:

    - +

    This release marks the first mature version of MO-Gymnasium within Farama, indicating that the API is stable, and we have achieved a high level of quality in this library.

    API

    • Release Notes
        +
      • v1.3.0: MO-Gymnasium 1.3.0 Release: New Mujoco v5 Environments
      • v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more
      • v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more
      • v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more
      • @@ -711,7 +734,7 @@

        0.1.1 + diff --git a/search/index.html b/search/index.html index df58580..ff05a0f 100644 --- a/search/index.html +++ b/search/index.html @@ -249,6 +249,7 @@
      • MO-Hopper
      • MO-Halfcheetah
      • MO-Walker2D
      • +
      • Version History
      • MO-Ant
      • MO-Swimmer
      • MO-Humanoid
      • @@ -393,7 +394,7 @@ - + diff --git a/searchindex.js b/searchindex.js index 9ee8587..f4836af 100644 --- a/searchindex.js +++ b/searchindex.js @@ -1 +1 @@ -Search.setIndex({"alltitles": {"0.1.1": [[45, "release-0-1-1"]], "0.1.2": [[45, "release-0-1-2"]], "0.2.0": [[45, "release-0-2-0"]], "0.2.1": [[45, "release-0-2-1"]], "1. Create a new environment class": [[46, "create-a-new-environment-class"]], "2. Register the environment": [[46, "register-the-environment"]], "3. Test the environment": [[46, "test-the-environment"]], "4. Instantiate your environment": [[46, "instantiate-your-environment"]], "404 - Page Not Found": [[0, null]], "API": [[42, null], [43, null]], "Acknowledgements": [[3, "acknowledgements"]], "Action Space": [[4, "action-space"], [6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [13, "action-space"], [14, "action-space"], [15, "action-space"], [32, "action-space"], [37, "action-space"], [38, "action-space"]], "Arguments": [[4, "arguments"], [6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [13, "arguments"], [14, "arguments"], [15, "arguments"], [38, "arguments"]], "Breakable-Bottles": [[4, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Citation": [[39, null]], "Citing": [[42, "citing"]], "Classic Control": [[5, null]], "Community": [[3, null]], "Creating a custom environment": [[46, null]], "Credits": [[4, "credits"], [6, "credits"], [7, "credits"], [8, "credits"], [9, "credits"], [10, "credits"], [13, "credits"], [14, "credits"], [15, "credits"], [37, "credits"], [38, "credits"]], "Deep-Sea-Treasure": [[6, null]], "Deep-Sea-Treasure-Concave": [[7, null]], "Deep-Sea-Treasure-Mirrored": [[8, null]], "Description": [[4, "description"], [6, "description"], [7, "description"], [8, "description"], [9, "description"], [10, "description"], [11, "description"], [13, "description"], [14, "description"], [15, 
"description"], [17, "description"], [18, "description"], [19, "description"], [20, "description"], [22, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [32, "description"], [33, "description"], [34, "description"], [35, "description"], [37, "description"], [38, "description"]], "Episode Termination": [[4, "episode-termination"], [6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [11, "episode-termination"], [13, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [33, "episode-termination"], [37, "episode-termination"]], "Fishwood": [[9, null]], "Four-Room": [[10, null]], "Fruit-Tree": [[11, null]], "Grid-World": [[12, null]], "Install": [[42, "install"], [44, null]], "LinearReward": [[48, "linearreward"]], "List of Publications": [[41, null]], "MO-Ant": [[17, null]], "MO-Ant-2D": [[18, null]], "MO-Gymnasium 0.3.0 Release: Migrate to Gymnasium": [[45, "release-0-3-0"]], "MO-Gymnasium 0.3.1 Release: Improved documentation and MuJoco MO-Reacher environment": [[45, "release-0-3-1"]], "MO-Gymnasium 0.3.2 Release: Bug fixes, improved webpage": [[45, "release-0-3-2"]], "MO-Gymnasium documentation": [[1, null]], "MO-Halfcheetah": [[19, null]], "MO-Highway": [[20, null]], "MO-Highway-Fast": [[21, null]], "MO-Hopper": [[22, null]], "MO-Hopper-2D": [[23, null]], "MO-Humanoid": [[24, null]], "MO-Lunar-Lander": [[25, null]], "MO-Lunar-Lander-Continuous": [[26, null]], "MO-Mountaincar": [[27, null]], "MO-Mountaincar-3D": [[28, null]], "MO-Mountaincar-Timemove": [[29, null]], "MO-Mountaincar-Timespeed": [[30, null]], "MO-Mountaincarcontinuous": [[31, null]], "MO-Reacher": [[32, null]], "MO-Supermario": [[33, null]], "MO-Swimmer": [[34, null]], "MO-Walker2D": [[35, null]], "MOClipReward": [[48, "moclipreward"]], "MOMaxAndSkipObservation": [[48, "momaxandskipobservation"]], "MONormalizeReward": [[48, "monormalizereward"]], "MORL 
Baselines": [[40, null]], "MORecordEpisodeStatistics": [[47, "morecordepisodestatistics"], [48, "morecordepisodestatistics"]], "MOSyncVectorEnv": [[47, "mosyncvectorenv"]], "Minecart": [[13, null]], "Minecart-Deterministic": [[14, null]], "Minecart-Rgb": [[15, null]], "Miscellaneous": [[16, null]], "MuJoCo": [[36, null]], "Observation Space": [[4, "observation-space"], [6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [13, "observation-space"], [14, "observation-space"], [15, "observation-space"], [32, "observation-space"], [37, "observation-space"], [38, "observation-space"]], "References": [[10, "references"]], "Release Notes": [[45, null]], "Resource-Gathering": [[37, null]], "Reward Space": [[4, "reward-space"], [6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [9, "reward-space"], [10, "reward-space"], [11, "reward-space"], [13, "reward-space"], [14, "reward-space"], [15, "reward-space"], [17, "reward-space"], [18, "reward-space"], [19, "reward-space"], [20, "reward-space"], [22, "reward-space"], [23, "reward-space"], [24, "reward-space"], [25, "reward-space"], [26, "reward-space"], [32, "reward-space"], [33, "reward-space"], [34, "reward-space"], [35, "reward-space"], [37, "reward-space"], [38, "reward-space"]], "Reward space:": [[27, "reward-space"], [28, "reward-space"], [29, "reward-space"], [30, "reward-space"], [31, "reward-space"]], "Starting State": [[4, "starting-state"], [6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [13, "starting-state"], [14, "starting-state"], [15, "starting-state"], [37, "starting-state"], [38, "starting-state"]], "Termination": [[9, "termination"]], "The requested page could not be found.": [[0, "the-requested-page-could-not-be-found"]], "Vector Wrappers": [[47, null]], "Water-Reservoir": [[38, null]], "Wrappers": 
[[48, null]], "v0.3.3: MO-Gymnasium 0.3.3 Release: Policy Evaluation bug fix, better documentation page": [[45, "release-v0-3-3"]], "v0.3.4: MO-Gymnasium 0.3.4 Release: Known Pareto Front, improved renders and documentation": [[45, "release-v0-3-4"]], "v1.0.0: MO-Gymnasium becomes mature": [[45, "release-v1-0-0"]], "v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more": [[45, "release-v1-0-1"]], "v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more": [[45, "release-v1-1-0"]], "v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more": [[45, "release-v1-2-0"]]}, "docnames": ["404", "README", "citing/citing", "community/community", "environments/breakable-bottles", "environments/classical", "environments/deep-sea-treasure", "environments/deep-sea-treasure-concave", "environments/deep-sea-treasure-mirrored", "environments/fishwood", "environments/four-room", "environments/fruit-tree", "environments/grid-world", "environments/minecart", "environments/minecart-deterministic", "environments/minecart-rgb", "environments/misc", "environments/mo-ant", "environments/mo-ant-2d", "environments/mo-halfcheetah", "environments/mo-highway", "environments/mo-highway-fast", "environments/mo-hopper", "environments/mo-hopper-2d", "environments/mo-humanoid", "environments/mo-lunar-lander", "environments/mo-lunar-lander-continuous", "environments/mo-mountaincar", "environments/mo-mountaincar-3d", "environments/mo-mountaincar-timemove", "environments/mo-mountaincar-timespeed", "environments/mo-mountaincarcontinuous", "environments/mo-reacher", "environments/mo-supermario", "environments/mo-swimmer", "environments/mo-walker2d", "environments/mujoco", "environments/resource-gathering", "environments/water-reservoir", "examples/citation", "examples/morl_baselines", "examples/publications", 
"index", "introduction/api", "introduction/install", "release_notes", "tutorials/custom_env", "wrappers/vector_wrappers", "wrappers/wrappers"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["404.md", "README.md", "citing/citing.md", "community/community.md", "environments/breakable-bottles.md", "environments/classical.md", "environments/deep-sea-treasure.md", "environments/deep-sea-treasure-concave.md", "environments/deep-sea-treasure-mirrored.md", "environments/fishwood.md", "environments/four-room.md", "environments/fruit-tree.md", "environments/grid-world.md", "environments/minecart.md", "environments/minecart-deterministic.md", "environments/minecart-rgb.md", "environments/misc.md", "environments/mo-ant.md", "environments/mo-ant-2d.md", "environments/mo-halfcheetah.md", "environments/mo-highway.md", "environments/mo-highway-fast.md", "environments/mo-hopper.md", "environments/mo-hopper-2d.md", "environments/mo-humanoid.md", "environments/mo-lunar-lander.md", "environments/mo-lunar-lander-continuous.md", "environments/mo-mountaincar.md", "environments/mo-mountaincar-3d.md", "environments/mo-mountaincar-timemove.md", "environments/mo-mountaincar-timespeed.md", "environments/mo-mountaincarcontinuous.md", "environments/mo-reacher.md", "environments/mo-supermario.md", "environments/mo-swimmer.md", "environments/mo-walker2d.md", "environments/mujoco.md", "environments/resource-gathering.md", "environments/water-reservoir.md", "examples/citation.md", "examples/morl_baselines.md", "examples/publications.md", "index.md", "introduction/api.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "wrappers/vector_wrappers.md", "wrappers/wrappers.md"], "indexentries": {"linearreward 
(class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.LinearReward", false]], "moclipreward (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MOClipReward", false]], "momaxandskipobservation (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MOMaxAndSkipObservation", false]], "monormalizereward (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MONormalizeReward", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers)": [[48, "mo_gymnasium.wrappers.MORecordEpisodeStatistics", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers.vector)": [[47, "mo_gymnasium.wrappers.vector.MORecordEpisodeStatistics", false]], "mosyncvectorenv (class in mo_gymnasium.wrappers.vector)": [[47, "mo_gymnasium.wrappers.vector.MOSyncVectorEnv", false]]}, "objects": {"mo_gymnasium.wrappers": [[48, 0, 1, "", "LinearReward"], [48, 0, 1, "", "MOClipReward"], [48, 0, 1, "", "MOMaxAndSkipObservation"], [48, 0, 1, "", "MONormalizeReward"], [48, 0, 1, "", "MORecordEpisodeStatistics"]], "mo_gymnasium.wrappers.vector": [[47, 0, 1, "", "MORecordEpisodeStatistics"], [47, 0, 1, "", "MOSyncVectorEnv"]]}, "objnames": {"0": ["py", "class", "Python class"]}, "objtypes": {"0": "py:class"}, "terms": {"": [4, 5, 6, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 42, 43, 45, 48], "0": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 47, 48], "01": 45, "02": 45, "03": 45, "06": 45, "07": [27, 28, 29, 30, 31], "08": [45, 48], "09": 45, "1": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 47, 48], "10": [6, 7, 8, 11, 12, 25, 26, 37, 38, 45], "100": [25, 26, 33, 45, 47, 48], "101": 45, "103": 45, "105": 45, "106": 45, "107": 45, "11": [6, 7, 22, 23, 45], "1109": 38, "1145": 37, "12": 45, "124": [7, 8], "13": [10, 45], "1390156": 37, "1390162": 37, "14": 
[10, 45], "16": 45, "160": 38, "17": [19, 24, 35], "18": 45, "19": 45, "1e": [34, 48], "2": [4, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 47], "20": [8, 45], "200": 9, "2008": [12, 37], "2010": 12, "2011": 5, "2012": 38, "2013": 16, "2017": 10, "2018": 12, "2019": [6, 7, 8, 11, 12, 13, 14, 15, 16], "2020": 36, "2021": 12, "2022": [2, 5, 12, 41, 45], "2022bnaic": 2, "2023": [39, 41, 42, 45], "2024": [41, 45], "21": 45, "23": [6, 45], "24": 45, "240": [4, 33], "25": [33, 45], "255": [15, 33], "256": 33, "25th": 37, "26": 45, "27": [17, 18, 45], "28": [25, 26], "2d": [6, 7, 8, 10, 13, 14, 15, 31, 45, 47], "3": [4, 6, 7, 8, 10, 13, 14, 15, 17, 18, 20, 21, 22, 23, 25, 26, 27, 28, 29, 30, 32, 33, 37, 38, 47], "30": 45, "31": 45, "33": 45, "34": 45, "34th": 2, "35": 45, "360": 4, "37": 45, "376": 24, "37th": [39, 42], "3d": [5, 13, 14, 15, 27, 29, 30], "4": [4, 6, 7, 8, 10, 13, 14, 15, 24, 25, 26, 32, 33, 34, 37, 38, 47, 48], "40": 45, "41": [37, 45], "42": [45, 47], "43": 45, "45": 45, "46": 45, "47": [37, 45], "480": 15, "5": [4, 11, 12, 13, 14, 15, 20, 21, 25, 26, 33, 37, 45], "50": [4, 45], "51": 45, "52": 45, "53": 45, "55": 45, "56": 45, "57": 45, "58": 45, "59": 45, "6": [11, 12, 13, 14, 15, 19, 25, 26, 27, 28, 29, 30, 31, 32, 35], "60": 45, "61": 45, "62": 45, "6252759": 38, "63": 11, "64": 45, "65": 45, "67": 45, "69": 45, "7": [6, 11, 12, 13, 14, 15, 45, 47], "70": 45, "72": 45, "73": 45, "74": 45, "75": 45, "76": 45, "77": 45, "79": 45, "8": [17, 18, 25, 26, 34, 38, 42, 43, 45], "80": 45, "81": 45, "83": 45, "84": 45, "86": 45, "87": 45, "89": 45, "9": 32, "90": 45, "91": 45, "92": 45, "93": 45, "94": 45, "95": 45, "97": 45, "99": [45, 48], "A": [2, 4, 10, 16, 17, 18, 21, 27, 28, 29, 30, 31, 38, 39, 41, 42, 43, 48], "As": [4, 42, 43], "At": 47, "But": 48, "By": [27, 28, 29, 30, 38], "For": [1, 32, 42, 43, 45, 47], "If": [3, 13, 14, 15, 17, 18, 22, 23, 38, 39, 42, 46], "In": [4, 45], "It": 
[40, 42, 43, 45, 46], "Of": 45, "The": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 31, 32, 33, 34, 35, 37, 38, 42, 45, 46, 47], "There": 38, "To": [1, 6, 7, 8, 42, 44], "With": 45, "_": 47, "__init__": 46, "_build": 1, "_episod": 47, "_forward_reward_weight": 45, "_modul": 48, "aama": 41, "abel": [13, 14, 15, 16], "about": [1, 5], "abov": 4, "acceler": [13, 14, 15], "accept": 45, "access": [45, 47], "account": [4, 12], "achiev": 45, "act": [42, 43, 45], "action": [5, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 36, 45, 46, 47], "action_spac": [46, 47], "acttyp": 48, "ad": [17, 18, 22, 23, 45, 46, 47], "adapt": [6, 7, 8, 10], "add": [27, 28, 29, 30, 41, 45], "add_speed_object": [27, 28, 29, 30], "addit": 5, "addition": 45, "after": [9, 45, 48], "again": 4, "agent": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 37, 38, 45], "ai": 4, "al": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 36, 41], "alegr": [2, 12, 39, 41, 42], "algorithm": [40, 42], "align": 41, "all": [3, 17, 18, 37, 42, 44, 45, 47, 48], "allow": 45, "also": [3, 16, 42, 43, 45], "altern": [27, 28, 29, 30], "alwai": [6, 7, 8], "amount": [16, 38], "amp": 45, "an": [5, 10, 27, 28, 29, 30, 33, 37, 38, 42, 43, 45, 46, 48], "ana": [2, 39, 42], "andrea": 45, "andr\u00e9": 10, "angl": 32, "angular": 32, "ani": 47, "ann": [2, 39, 42], "ansi": 38, "ansimuz": [6, 7, 8], "ant": 36, "antenv": [17, 18], "api": [40, 45, 46], "appear": 2, "appli": [4, 32, 47], "approach": 4, "approxim": 41, "ar": [3, 4, 13, 14, 15, 16, 37, 38, 45, 46, 47, 48], "arm": 32, "arrai": [10, 17, 18, 19, 22, 23, 34, 42, 43, 45, 46, 47, 48], "art": [4, 6, 7, 8, 45], "artifici": 2, "asid": 3, "ask": 3, "asset": [4, 37, 45], "assist": [4, 6, 7, 8], "associ": 45, "atari_wrapp": 48, "attribut": 46, "australia": 38, "author": [2, 39, 42], "autobuild": 1, "automat": [1, 45, 46], "avail": [45, 47, 48], "averag": 48, "avoid": [10, 16], "axel": [13, 14, 15], "axelabel": 3, "axi": 
[22, 23], "b": 1, "back": 45, "background": [6, 7, 8, 38], "backward": 5, "balanc": 45, "barret": 12, "barreto": 10, "barrett": 37, "base": [3, 4, 13, 14, 15, 32, 36, 38, 41, 45, 48], "baselin": 45, "baselines3": 48, "batteri": 45, "bazzan": [2, 39, 42], "becaus": 4, "been": [4, 5, 45], "befor": 47, "begin": [47, 48], "behind": 5, "benchmark": [39, 41, 42], "benefit": 45, "benelearn": 2, "benelux": 2, "between": [33, 38, 42, 45, 48], "bib": 45, "binari": [10, 11, 12], "blob": [13, 14, 15], "blue": 10, "bnaic": [2, 41], "bnj6kubtg6": 42, "booktitl": [2, 39, 42], "bool": 47, "boolean": [4, 47], "both": 48, "both_norm_env": 48, "bottl": 12, "bottle_reward": 4, "bottles_carri": 4, "bottles_deliv": [4, 12], "bottles_drop": 4, "bound": [38, 45], "box": [6, 7, 8, 17, 18, 19, 22, 23, 24, 26, 31, 34, 35, 38], "brake": [13, 14, 15], "break": 45, "breakabl": 12, "breakablebottl": 4, "brisban": 38, "bro": 33, "bruno": [2, 39, 42], "budget": 41, "buffer": 47, "buffer_length": [47, 48], "bugfix": 45, "bump": 45, "button": 45, "c": [2, 39, 42], "cai": 41, "calcul": 4, "call": 45, "callabl": 47, "can": [3, 4, 9, 11, 13, 14, 15, 27, 28, 29, 30, 38, 42, 43, 44, 45, 47, 48], "cannot": 4, "capabl": 45, "capac": [13, 14, 15], "car": [5, 27, 28, 29, 30, 45], "carb": [11, 12], "care": 47, "carri": 4, "cart": [13, 14, 15], "castelletti": 38, "catch": 9, "caus": 45, "cc": 45, "cd": 1, "cell": 12, "central": 32, "certain": [42, 44], "chanc": 12, "chang": [1, 6, 7, 8, 27, 28, 29, 30, 45], "changelog": 45, "check": [42, 43, 45], "chose": 11, "ci": 45, "circl": 10, "citat": 45, "cite": 39, "class": [5, 42, 43, 47, 48], "classic": [6, 7, 8, 46], "clip": 48, "close": 46, "co": [13, 14, 15, 32], "code": [3, 6, 7, 8, 9, 10, 13, 14, 15, 38, 45, 48], "coin": [16, 33], "colab": [42, 43], "collect": [9, 10, 11, 12, 13, 14, 15, 16, 33, 37, 45], "collis": [16, 20], "com": [3, 13, 14, 15], "combin": 45, "commit": 45, "common": 48, "commun": [42, 45], "compar": 42, "complet": 48, "compliant": 42, 
"compon": [10, 45, 48], "compromis": 45, "comput": [32, 45, 46], "concav": [12, 45], "concave_map": [6, 7, 8], "conduct": 45, "confer": [2, 37, 38, 39, 42], "config": [13, 14, 15], "configur": [13, 14, 15], "conflict": 45, "conor": 3, "consequ": 45, "consist": 37, "constructor": 46, "consum": [13, 14, 15], "consumpt": [5, 13, 14, 15, 16], "contain": [1, 4, 10, 11, 12, 13, 14, 15, 27, 28, 29, 30, 31, 32, 40], "content": 38, "context": 45, "continu": [5, 6, 7, 8, 16, 31, 36, 38, 45], "contribut": [1, 3, 4, 45], "contributor": [3, 45], "control": [6, 7, 8, 9, 17, 18, 19, 22, 23, 24, 34, 35], "control_cost": 45, "converg": 5, "convers": 45, "convex": [6, 7, 8], "coordin": [6, 7, 8, 37, 42], "copi": 47, "corner": [13, 14, 15], "correct": 45, "correspond": [16, 27, 28, 29, 30, 38], "cost": [17, 18, 19, 22, 23, 24, 25, 26, 34, 35, 38], "cost_flood": 16, "cost_object": [17, 18, 22, 23], "crash": [25, 26], "creat": [4, 6, 7, 8, 42, 43, 45], "creation": 45, "criteria": 37, "ctrl_cost": 45, "cumul": [47, 48], "current": [4, 6, 7, 8, 38], "custom": 45, "d": [11, 12, 41], "da": [2, 39, 42], "dall": [4, 6, 7, 8], "dam": [16, 38], "danoi": [2, 39, 42], "deal": 46, "death": 16, "decis": 38, "decomposit": 41, "deep": [3, 12, 47, 48], "deep_sea_treasur": 45, "deepseatreasur": [6, 7, 8], "default": [6, 7, 8, 13, 14, 15, 27, 28, 29, 30, 38], "deficit": 38, "deficit_wat": 16, "defin": [4, 5, 16, 32, 46], "definit": [42, 43], "deliv": [4, 12], "demand": 38, "deni": [3, 9], "dens": [13, 14, 15], "depend": [42, 44], "deprec": 45, "depth": [11, 12], "deque_s": 47, "descript": [5, 12, 16, 36], "design": [45, 47], "desir": 45, "destin": 12, "detail": [5, 42, 43], "determin": 45, "determinist": 45, "develop": 42, "deviat": 48, "di": 33, "diamond": 37, "dict": 4, "dictionari": [4, 12], "did": 4, "differ": [4, 12, 45], "dim_reward": 47, "dimens": [4, 45], "dimension": [6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 32, 33, 34, 35, 37], "directli": [45, 47, 48], "directori": 
46, "dirhtml": 1, "disc_episode_return": 45, "discord": [3, 42], "discount": [46, 47, 48], "discret": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 21, 25, 27, 28, 29, 30, 32, 33, 36, 37, 45], "dissert": 5, "distanc": [32, 46], "distinct": 45, "distribut": 41, "do": 45, "doc": [1, 45], "document": [42, 46], "doe": [42, 44, 48], "doi": 38, "domain": 45, "done": [46, 47], "dot": 48, "down": [6, 7, 8, 10, 37], "downstream": 38, "dr": [47, 48], "drop": [4, 45], "dst": [12, 45], "dst_map": [6, 7, 8], "dtype": [45, 47], "due": [5, 38], "dynmorl": 3, "e": [1, 2, 4, 6, 7, 8, 12, 31, 39, 42, 45], "each": [4, 6, 7, 8, 11, 13, 14, 15, 27, 28, 29, 30, 31, 32, 45, 47], "eat": 12, "edit": 45, "effici": 41, "either": 9, "el": [2, 39, 42], "elaps": [47, 48], "elbow": 32, "element": [37, 45], "els": [10, 33, 37], "en": 48, "enabl": 45, "end": [9, 13, 14, 15, 47], "enemi": [4, 12, 16, 33, 37], "energi": 36, "engin": [25, 26], "entri": 41, "entry_point": 46, "env": [3, 5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 36, 42, 43, 45, 46, 47, 48], "env_fn": 47, "environ": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 38, 41, 42, 43, 44, 47], "episod": [9, 38, 47, 48], "epsilon": 48, "equival": 5, "error": 45, "esr": [12, 45], "essenti": [42, 46], "et": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 36, 41], "eval_mo": 45, "everi": [1, 11, 12, 48], "exampl": [10, 40, 42, 43, 45, 47, 48], "except": 48, "excess": 38, "execut": [16, 38], "exhaust": 45, "expand": 45, "expect": 9, "extend": 45, "extra": [5, 27, 28, 29, 30], "extract": 48, "ezpickl": 45, "f": [3, 38], "fair": 41, "fall": 45, "fals": [17, 18, 22, 23, 47], "famili": [42, 44], "fan": 41, "fantasi": [6, 7, 8], "far": 33, "farama": [3, 13, 14, 15, 42, 45], "fast": [16, 45], "fat": [11, 12], "featur": [3, 10, 45], "feder": 41, "felten": [2, 12, 39, 41, 42], "felten_toolkit_2023": [39, 42], "few": [45, 47, 48], "ffelten": 
45, "file": [13, 14, 15, 45, 46], "fill": [13, 14, 15], "finger_tip_coord": 32, "fire": 12, "first": [2, 13, 14, 15, 38, 41, 45, 47], "fish": [9, 12], "fish_amount": 12, "fisherman": 9, "fishproba": 9, "fishwood": [3, 12, 45], "fit": 38, "fix": 10, "flag": [4, 17, 18, 22, 23, 33, 37, 46], "flexibl": 45, "float": [38, 46, 47, 48], "float32": [17, 18, 19, 22, 23, 24, 26, 31, 34, 35, 38, 47], "float_stat": [6, 7, 8], "flood": 38, "florian": [2, 39, 42], "folder": [1, 45], "follow": [2, 10, 13, 14, 15, 17, 18, 19, 22, 23, 27, 28, 29, 30, 34, 42, 43, 45, 46], "forgotten": 45, "fork": 1, "form": 47, "formerli": [2, 41], "forward": [5, 19, 22, 23, 24, 27, 28, 29, 30, 34, 35], "forward_penalti": 5, "forward_reward": 45, "found": 45, "foundat": [13, 14, 15, 45], "four": [3, 12, 32], "frame": 48, "frame_skip": [13, 14, 15], "frameskip": 48, "framework": 41, "from": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 37, 38, 45, 46, 47, 48], "front": 46, "fruit": [3, 12], "fruit_tre": 45, "fuel": [5, 13, 14, 15, 16, 25, 26, 31], "fuel_consumption_penalti": 5, "full": [11, 12, 45], "function": [42, 43, 45], "g": [10, 12, 45], "gamma": [46, 47, 48], "gather": [12, 45], "gem": [4, 12, 37], "gener": [41, 45, 46], "get": 45, "gg": 42, "ghazali": [2, 39, 42], "gif": 45, "gimelfarb": [3, 10], "github": [3, 13, 14, 15, 45], "give": 5, "given": 48, "go": [1, 9, 11, 22, 23, 27, 28, 29, 30], "goal": [10, 12, 27, 28, 29, 30, 31], "goe": 46, "goir": [2, 39, 42], "gold": [4, 12, 37], "gr": [2, 39, 42], "green": 10, "grid": [6, 7, 8], "gridworld": [10, 12], "ground": 4, "group": 45, "gt": 45, "guarante": 41, "guid": [42, 43], "gupta": 5, "gym": [2, 33, 41, 42, 43, 45], "gymnasium": [2, 5, 13, 14, 15, 16, 17, 18, 19, 22, 23, 24, 25, 26, 27, 28, 29, 30, 34, 35, 40, 41, 42, 43, 44, 46, 47, 48], "ha": [4, 5, 33, 45, 47], "halfcheetah": [36, 45], "halfcheetahenv": 19, "harder": 12, "hartmann": 41, "have": [3, 4, 5, 12, 42, 45, 48], "hay": 3, "healthi": [17, 18], "heavili": 48, "height": 36, 
"help": 3, "here": [3, 10, 42, 43, 45], "high": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 45], "higher": 45, "highwai": [16, 45], "highwayenv": 20, "highwayfastenv": 21, "home": [4, 37], "hopper": [36, 45], "hopperenv": [22, 23], "hotfix": 45, "how": [1, 13, 14, 15, 33, 40, 45], "html": 48, "http": [3, 4, 6, 7, 8, 13, 14, 15, 37, 38, 42, 48], "human": [13, 14, 15, 38], "humanoid": 36, "humanoidenv": 24, "humonoid": 36, "hung": 5, "hydroelectr": 38, "hyperparamet": 41, "i": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 40, 42, 43, 45, 46, 47, 48], "ianleongudri": 45, "id": 46, "idx": 48, "igd": 46, "ijcnn": 38, "illustr": 45, "imag": [13, 14, 15, 16, 38], "image_observ": [13, 14, 15], "impact": 4, "implement": [4, 40, 46], "import": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 45, 46, 47, 48], "improv": 41, "includ": [16, 42, 44], "inconsist": 45, "increment": [13, 14, 15], "incremental_frame_skip": [13, 14, 15], "index": [47, 48], "indic": [4, 10, 37, 45, 47], "inf": [4, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 32, 33, 34, 35, 38], "info": [42, 43, 45, 46, 47, 48], "info_dict": 45, "inform": [1, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 39, 42], "inher": 45, "inherit": 46, "init": 45, "initi": [38, 46], "initial_st": 38, "inproceed": [2, 39, 42], "inspir": 48, "instal": 1, "instanc": [42, 43, 45], "instead": [4, 45], "int": [47, 48], "int32": 47, "integ": 46, "integr": 45, "intellig": 2, "interact": [42, 43], "intern": [37, 38], "introduc": [5, 10, 45], "invert": 46, "io": [4, 6, 7, 8, 37, 48], "issu": 45, "itch": [4, 6, 7, 8, 37], "item": [10, 12], "item1": 12, "item2": 12, "item3": 12, "iter": [38, 47], "its": 46, "ivanov": 41, "j": 45, "johnson": 45, "join": [3, 42], "joint": [32, 
38], "json": [13, 14, 15], "jump": [22, 23], "kallinteri": 45, "katze2664": 45, "keep": [47, 48], "kei": [4, 47], "kill": [12, 33, 37], "klassert": 4, "known": 46, "kwarg": 46, "l": [2, 39, 42, 47, 48], "lack": 5, "lambda": 47, "land": [5, 25, 26], "lander": [5, 45], "lane": [16, 20], "larger": 4, "last": [47, 48], "leaf": [11, 12], "learn": [2, 4, 9, 10, 37, 39, 41, 42, 43, 45], "left": [4, 6, 7, 8, 10, 11, 13, 14, 15, 37], "length": [47, 48], "length_queu": 47, "leon": 37, "level": [38, 45], "leverag": 41, "librari": [2, 41, 42, 45], "life": 45, "light": 12, "like": [3, 42, 44, 48], "limezu": [4, 37], "limit": 16, "line": 46, "linear": [17, 18, 19, 22, 23, 34], "linearli": 45, "linearreward": [17, 18, 19, 22, 23, 34, 42, 43, 45], "linearwrapp": 45, "link": 45, "lint": 45, "list": [4, 45], "literatur": 45, "local": 5, "locat": [4, 12, 32], "logo": 45, "look": 48, "low": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38], "lower": 10, "luca": [2, 39, 42], "lucasalegr": 45, "lunar": [5, 45], "lunarland": [5, 25, 26], "m": 38, "machin": 37, "made": [1, 45], "mai": 45, "main": [3, 13, 14, 15, 25, 26], "main_engine_fuel": 5, "make": [1, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 45, 46, 47, 48], "mani": [13, 14, 15, 47], "map": [6, 7, 8, 10, 12, 13, 14, 15, 45], "mario": [33, 45], "mark": 45, "markov": 38, "master": 48, "match": 45, "mathieu": [3, 38], "max": 48, "max_r": 48, "max_t": 9, "maxandskipenv": 48, "maxima": 5, "maximum": 38, "maze": 10, "md": [1, 45], "mdp": [42, 43, 45], "mean": 48, "merg": [5, 27, 28, 29, 30], "merge_move_penalti": [27, 28, 29, 30], "method": [45, 46], "metric": 46, "mgoulao": 45, "mike": [3, 10], "min": 48, "min_r": 48, "mine": [13, 14, 15], "mine_config": [13, 14, 15], "minecart": [3, 16, 42, 43, 45], "miner": [11, 12], "minerium": [13, 14, 15], "minim": [13, 14, 15, 16], "minor": 45, 
"mirror": 12, "mirrored_map": [6, 7, 8], "miss": [41, 45], "mistak": 45, "mo": [2, 3, 5, 13, 14, 15, 16, 36, 40, 41, 42, 43, 44, 46, 47, 48], "mo_gym": [17, 18, 19, 22, 23, 34, 42, 43, 45, 47, 48], "mo_gymnasium": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38, 42, 43, 45, 46, 47, 48], "mode": [13, 14, 15, 38], "model": [41, 42, 43], "modem": 41, "modifi": 45, "modul": [47, 48], "mofl": 41, "momaxandskipobserv": 45, "momdp": [42, 43, 45], "monormalizereward": 45, "more": [1, 5, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 42, 43], "morecordepisodestatist": 45, "moreov": [46, 47], "morewordstatist": 47, "morl": [3, 6, 7, 8, 9, 42, 43, 45], "most": 47, "mountain": [5, 27, 28, 29, 30, 31, 45], "mountaincar": [5, 31], "mountaincarcontinu": [5, 45], "move": [4, 5, 33, 34, 37, 45, 48], "move_penalti": 5, "much": 33, "mujoco": [42, 44], "multi": [2, 5, 9, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 32, 33, 34, 35, 36, 38, 39, 41, 42, 43, 45, 46], "multibinari": 4, "multiobject": 4, "multipl": [4, 37, 40, 41, 45, 46, 47], "must": [12, 13, 14, 15, 16, 46], "my_env_dir": 46, "my_env_fil": 46, "my_env_v0": 46, "myenv": 46, "mypi": 45, "n": [2, 39, 42], "nO": 38, "narayanan": [12, 37], "ndarrai": 48, "need": 45, "neg": [10, 31, 32], "neighbour": 16, "network": 38, "neural": [38, 39, 42], "neurip": [39, 41, 42], "next": 46, "next_ob": [42, 43, 45], "ninjikin": [4, 37], "nip": 10, "node": 11, "none": [13, 14, 15, 38, 45, 48], "norm": 31, "norm_treasure_env": 48, "normal": [38, 45, 47, 48], "normalized_act": 38, "note": [4, 48], "notebook": [42, 43], "now": [2, 39, 42, 45], "np": [17, 18, 19, 22, 23, 34, 42, 43, 45], "num": 47, "num_env": 47, "number": [4, 38], "numpi": [42, 43, 45, 46], "nutri1": 12, "nutri6": 12, "nutrient": [11, 12], "ob": [5, 12, 16, 36, 42, 43, 45, 47], "object": [2, 5, 9, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 
32, 33, 34, 35, 36, 38, 39, 41, 42, 43, 45, 46], "observ": [12, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 45, 46, 48], "observation_spac": 46, "observationspac": 45, "obstyp": 48, "off": 45, "oject": 46, "onc": 1, "one": [42, 44, 45, 48], "onli": [38, 48], "open": [41, 42], "opengameart": 38, "optim": [37, 41, 45], "option": [27, 28, 29, 30, 42, 43, 45, 46], "order": 45, "ore1": 16, "ore2": 16, "ores": [13, 14, 15, 16], "org": [38, 42], "orient": [13, 14, 15], "origin": [4, 17, 18, 19, 22, 23, 34, 42, 43, 45], "other": [16, 17, 18, 22, 23, 42, 43, 45, 48], "otherwis": [4, 9, 33], "our": [1, 45, 46], "out": [3, 38], "outcom": 4, "output": 47, "packag": [1, 45], "paper": 4, "pareto": [41, 46], "pareto_front": [45, 46], "parisi": 38, "part": [45, 46], "pass": [33, 45], "passag": 10, "path": [13, 14, 15], "paulina": 38, "penal": 38, "penalti": [4, 5, 6, 7, 8, 12, 27, 28, 29, 30, 31, 33], "peopl": 3, "percentag": 38, "perform": [45, 46], "person": 41, "pf": 45, "pianosi": [16, 38], "pick": 4, "pip": [1, 42, 44], "pixel": [4, 6, 7, 8, 45], "plan": [42, 43], "pleas": [39, 41, 42], "plu": 10, "point": 33, "polici": [37, 41], "porcentag": [13, 14, 15], "port": 38, "posit": [5, 6, 7, 8, 10, 13, 14, 15, 32, 33, 37], "possibl": [4, 32], "potenti": [4, 12, 45], "pp": 38, "practic": [42, 43], "pranav": 5, "pranavg23": 45, "pre": 45, "predefin": 45, "prefer": 45, "prevent": 5, "previous": 45, "priorit": 41, "prob_drop": 4, "probabl": [4, 9], "problem": [4, 6, 7, 8, 9, 38, 45], "problemat": [42, 44], "proceed": [2, 37, 39, 42], "process": [39, 42], "product": 48, "project": 3, "protein": [11, 12], "provid": [3, 9, 42, 45, 47], "pseudo": 45, "public": [2, 42], "publish": 41, "pull": [41, 46], "py": [45, 46], "pydoc": 45, "pypi": 45, "pytest": 46, "python": [42, 43, 45], "q": 38, "qld": 38, "qualiti": 45, "quantiti": [13, 14, 15], "question": 3, "r": [1, 47, 48], "r_i": 32, "randint": 45, "random": 38, "rang": [45, 47], "rather": 4, "reach": [3, 6, 7, 
8, 10, 11, 12, 16, 27, 28, 29, 30, 31, 33, 45], "reacher": 36, "read": 5, "readm": 45, "readthedoc": 48, "reason": 5, "rebuild": 1, "receiv": [11, 45], "recent": 47, "recov": [17, 18, 19, 22, 23, 34], "red": 10, "refactor": [3, 13, 14, 15], "refer": 46, "registr": 46, "registri": 46, "reinforc": [2, 4, 9, 10, 39, 41, 42, 43, 45], "reinject": 48, "relax": [2, 39, 42], "releas": [16, 38], "reli": 45, "reliabl": [39, 41, 42], "remov": [27, 28, 29, 30], "remove_move_penalti": [27, 28, 29, 30], "renam": 45, "render": [13, 14, 15, 38, 46], "render_mod": [13, 14, 15, 38], "repeat": [13, 14, 15], "repositori": [39, 40, 42, 46], "repres": 45, "request": 41, "requir": 1, "research": [39, 41, 42], "reservoir": [3, 16, 45], "reset": [42, 43, 45, 46, 47, 48], "resourc": [12, 45], "respect": 47, "restelli": 38, "retriev": [13, 14, 15], "return": [9, 13, 14, 15, 37, 42, 45, 46, 48], "return_queu": 47, "revamp": 45, "revers": [4, 5, 27, 28, 29, 30], "reverse_penalti": 5, "reward": [5, 21, 42, 43, 45, 46, 47, 48], "reward_dim": 46, "reward_spac": [45, 46], "reymond": [3, 38], "rgb": [13, 14], "rgb_arrai": [13, 14, 15, 38], "right": [4, 6, 7, 8, 10, 11, 13, 14, 15, 20, 37], "right_lan": 16, "rightest": 16, "riva": 38, "rl": 45, "rnd": 45, "robert": 4, "rodriguez": 41, "roijer": 12, "room": [3, 12], "root": [11, 45], "run": [19, 24, 35, 46, 47], "runzheyang": 3, "safeti": 4, "same": [6, 7, 8], "sampl": [41, 47], "save": 45, "scalar": [17, 18, 19, 22, 23, 34, 42, 43, 45, 48], "scenario": 45, "scott": 45, "sea": [3, 12, 47, 48], "sebimarkgraf": 45, "second": [13, 14, 15], "section": 4, "see": [10, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 33, 34, 35, 42, 43, 45, 46], "seed": [46, 47], "select": 38, "self": [45, 46], "sens": 48, "separ": 10, "serenevillagerevamp": [4, 37], "serial": 47, "server": [3, 42], "set": [17, 18, 22, 23, 42, 45, 46], "setup": 45, "shape": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 
33, 34, 35, 37, 38, 46, 47], "shaped_reward": 5, "should": [45, 46], "shown": 45, "side": [25, 26], "side_engine_fuel": 5, "signal": 5, "silva": [2, 39, 42], "similar": [36, 45, 47], "similarli": [5, 16], "simon": 38, "simpl": [9, 42, 43], "simpli": 3, "sin": [13, 14, 15, 32], "sinc": [46, 47, 48], "singl": [27, 28, 29, 30, 45], "size": [4, 11, 46], "skip": 48, "sky": 38, "small": [4, 45], "smooth": 48, "snippet": 45, "so": 4, "some": [3, 42, 44, 46], "soto": 41, "sourc": [6, 7, 8, 10, 12, 13, 14, 15, 31, 42], "space": [5, 12, 16, 21, 36, 45, 46], "spars": [13, 14, 15], "specif": 47, "specifi": 4, "speed": [5, 13, 14, 15, 16, 20, 27, 28, 29, 30, 45], "speed_object": 5, "spell": 45, "sphinx": 1, "split": 10, "squar": 10, "srini": 37, "stabil": 48, "stabl": [45, 48], "stable_baselines3": 48, "stai": 16, "standard": [42, 45, 48], "static": 5, "statist": 47, "stats_kei": [47, 48], "steckelmach": [3, 9], "step": [4, 5, 6, 7, 8, 9, 27, 28, 29, 30, 31, 33, 38, 41, 42, 43, 45, 46, 47], "store": 47, "str": [47, 48], "structur": 45, "sub": 47, "submarin": [6, 7, 8, 12], "submiss": 41, "subpackag": 45, "successfulli": [25, 26], "successor": [3, 10], "suit": 42, "super": 33, "supermario": [3, 16], "supermariobro": 33, "supermariobrosenv": 16, "suppli": 38, "support": 16, "swimmer": 36, "swimmerenv": 34, "system": [39, 42, 44], "t": [47, 48], "tailor": 45, "take": [4, 12], "taken": 12, "talbi": [2, 39, 42], "target": 32, "target_1": 36, "target_2": 36, "target_3": 36, "target_4": 36, "target_i": 32, "taxonomi": 41, "termin": [42, 43, 45, 46, 47], "th": 48, "than": 4, "thank": 3, "thei": [45, 47, 48], "them": [3, 4, 5, 42, 43], "therefor": 11, "thi": [1, 4, 39, 42, 43, 44, 45, 46, 47, 48], "those": 10, "thought": 45, "three": [12, 45], "threshold": 38, "thrill": 45, "through": 46, "thu": 45, "ti": 46, "time": [1, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 27, 28, 29, 30, 31, 33, 47, 48], "time_limit": 38, "time_penalti": [4, 5, 12], "timemov": 5, "timespe": 5, "timondesch": 45, "tip": 
32, "titl": [2, 39, 42], "tomekst": 45, "tool": 45, "toolkit": [39, 41, 42], "top": [27, 28, 29, 30, 31], "torqu": 32, "touch": 48, "track": [47, 48], "trade": 45, "train": 48, "transfer": [3, 10], "transform": 45, "travel": 10, "treasur": [3, 4, 12, 37, 47, 48], "tree": [3, 12, 38], "triangl": 10, "true": [4, 6, 7, 8, 13, 14, 15, 38, 47], "truncat": [38, 42, 43, 45, 46, 47], "tuto": 45, "tutori": 46, "two": [9, 13, 14, 15, 16, 32, 33, 38, 48], "txt": 1, "type": [12, 13, 14, 15, 16, 45], "u": 3, "unbreakable_bottl": 4, "unbreakablebottl": 4, "under": [40, 45], "underwat": [6, 7, 8], "unpin": 45, "until": 38, "unwrap": 45, "up": [4, 6, 7, 8, 10, 37, 38], "upper": [13, 14, 15], "upstream": 38, "us": [6, 7, 8, 13, 14, 15, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48], "usag": 45, "user": 45, "util": [9, 45], "v0": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 21, 27, 28, 29, 30, 31, 33, 36, 37, 38, 42, 43, 47, 48], "v2": [5, 45], "v3": [25, 26, 45], "v4": [17, 18, 19, 22, 23, 24, 32, 34, 35, 36, 45], "valu": [4, 6, 7, 8, 11, 12, 41], "vamplew": [5, 12], "variabl": 47, "variou": [3, 40], "vecenv": 45, "vector": [10, 11, 13, 14, 15, 27, 28, 29, 30, 31, 33, 42, 45, 46, 48], "vector_reward": [42, 43, 45], "vectorenv": 47, "vectori": 45, "vehicl": 16, "veloc": [17, 18, 24, 32, 34, 35, 36], "veri": [42, 43, 46], "version": [5, 10, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 45], "via": [41, 47], "vitamin": [11, 12], "wa": [3, 4, 5, 6, 7, 8, 13, 14, 15, 41, 45], "wai": [3, 10], "walker2d": 36, "walker2denv": 35, "wall": 10, "want": 3, "warn": [16, 45], "water": [3, 11, 12, 16, 45], "we": [3, 42, 45, 46], "websit": [42, 45], "weight": [17, 18, 19, 22, 23, 34, 42, 43, 45, 48], "welfar": 41, "well": [42, 45, 46], "were": 10, "when": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 33, 37, 45, 46], "where": [6, 7, 8, 9, 11, 27, 28, 29, 30, 31, 45], "whether": [13, 14, 15, 38], "which": [4, 5, 6, 7, 8, 9, 10, 42, 45, 46, 47, 48], "while": [4, 
10, 12, 16], "within": [45, 46, 47], "wood": [9, 12], "wood_amount": 12, "woodproba": 9, "work": [42, 47], "worker": 45, "workshop": [2, 41], "world": [6, 7, 8], "would": 3, "wrap": [45, 47], "wrapped_env": 47, "wrapper": [40, 42, 43, 45], "wrt": 38, "x": [6, 7, 8, 17, 18, 22, 23, 24, 33, 34, 35, 37], "x_po": 16, "x_veloc": [36, 45], "xu": 36, "y": [6, 7, 8, 17, 18, 37], "y_veloc": 36, "yang": [6, 7, 8, 11, 12, 16], "year": [2, 39, 42], "you": [3, 39, 42, 43, 44, 45, 46], "your": [1, 39, 42], "your_ag": [42, 43, 45], "z": [22, 23], "zero": [32, 45]}, "titles": ["404 - Page Not Found", "MO-Gymnasium documentation", "<no title>", "Community", "Breakable-Bottles", "Classic Control", "Deep-Sea-Treasure", "Deep-Sea-Treasure-Concave", "Deep-Sea-Treasure-Mirrored", "Fishwood", "Four-Room", "Fruit-Tree", "Grid-World", "Minecart", "Minecart-Deterministic", "Minecart-Rgb", "Miscellaneous", "MO-Ant", "MO-Ant-2D", "MO-Halfcheetah", "MO-Highway", "MO-Highway-Fast", "MO-Hopper", "MO-Hopper-2D", "MO-Humanoid", "MO-Lunar-Lander", "MO-Lunar-Lander-Continuous", "MO-Mountaincar", "MO-Mountaincar-3D", "MO-Mountaincar-Timemove", "MO-Mountaincar-Timespeed", "MO-Mountaincarcontinuous", "MO-Reacher", "MO-Supermario", "MO-Swimmer", "MO-Walker2D", "MuJoCo", "Resource-Gathering", "Water-Reservoir", "Citation", "MORL Baselines", "List of Publications", "API", "API", "Install", "Release Notes", "Creating a custom environment", "Vector Wrappers", "Wrappers"], "titleterms": {"0": 45, "1": [45, 46], "2": [45, 46], "29": 45, "2d": [18, 23], "3": [45, 46], "3d": 28, "4": [45, 46], "404": 0, "Not": 0, "The": 0, "acknowledg": 3, "action": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 32, 37, 38], "ant": [17, 18], "api": [42, 43], "argument": [4, 6, 7, 8, 9, 10, 13, 14, 15, 38], "baselin": 40, "becom": 45, "better": 45, "bottl": [4, 45], "breakabl": [4, 45], "bug": 45, "build": 1, "citat": 39, "cite": 42, "class": 46, "classic": 5, "commun": 3, "concav": 7, "continu": 26, "control": 5, "could": 0, "creat": 46, 
"credit": [4, 6, 7, 8, 9, 10, 13, 14, 15, 37, 38], "custom": 46, "deep": [6, 7, 8, 45], "descript": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 32, 33, 34, 35, 37, 38], "determinist": 14, "document": [1, 45], "environ": [45, 46], "episod": [4, 6, 7, 8, 10, 11, 13, 14, 15, 33, 37], "evalu": 45, "fast": 21, "fishwood": 9, "fix": 45, "found": 0, "four": 10, "front": 45, "fruit": [11, 45], "gather": 37, "grid": 12, "gymnasium": [1, 45], "halfcheetah": 19, "highwai": [20, 21], "hopper": [22, 23], "humanoid": 24, "improv": 45, "instal": [42, 44], "instanti": 46, "known": 45, "lander": [25, 26], "linearreward": 48, "list": 41, "lunar": [25, 26], "matur": 45, "migrat": 45, "minecart": [13, 14, 15], "mirror": [8, 45], "miscellan": 16, "mo": [1, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 45], "moclipreward": 48, "momaxandskipobserv": 48, "monormalizereward": 48, "more": 45, "morecordepisodestatist": [47, 48], "morl": 40, "mosyncvectorenv": 47, "mountaincar": [27, 28, 29, 30, 45], "mountaincarcontinu": 31, "mujoco": [36, 45], "new": [45, 46], "note": 45, "observ": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 32, 37, 38], "page": [0, 45], "pareto": 45, "polici": 45, "public": 41, "pygam": 45, "reacher": [32, 45], "refer": 10, "regist": 46, "releas": 45, "render": 45, "request": 0, "reservoir": 38, "resourc": 37, "reward": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38], "rgb": 15, "room": 10, "sea": [6, 7, 8, 45], "space": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 37, 38], "start": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 37, 38], "state": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 37, 38], "supermario": 33, "support": 45, "swimmer": 34, "termin": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 33, 37], "test": [45, 46], "timemov": 29, "timespe": 30, "treasur": [6, 7, 8, 45], "tree": [11, 45], "updat": 45, "v0": 45, 
"v1": 45, "vector": 47, "walker2d": 35, "water": 38, "webpag": 45, "world": 12, "wrapper": [47, 48], "your": 46}}) \ No newline at end of file +Search.setIndex({"alltitles": {"0.1.1": [[47, "release-0-1-1"]], "0.1.2": [[47, "release-0-1-2"]], "0.2.0": [[47, "release-0-2-0"]], "0.2.1": [[47, "release-0-2-1"]], "1. Create a new environment class": [[48, "create-a-new-environment-class"]], "2. Register the environment": [[48, "register-the-environment"]], "3. Test the environment": [[48, "test-the-environment"]], "4. Instantiate your environment": [[48, "instantiate-your-environment"]], "404 - Page Not Found": [[0, null]], "API": [[44, null], [45, null]], "Acknowledgements": [[3, "acknowledgements"]], "Action Space": [[4, "action-space"], [6, "action-space"], [7, "action-space"], [8, "action-space"], [9, "action-space"], [10, "action-space"], [11, "action-space"], [13, "action-space"], [14, "action-space"], [15, "action-space"], [34, "action-space"], [39, "action-space"], [40, "action-space"]], "Arguments": [[4, "arguments"], [6, "arguments"], [7, "arguments"], [8, "arguments"], [9, "arguments"], [10, "arguments"], [13, "arguments"], [14, "arguments"], [15, "arguments"], [40, "arguments"]], "Breakable-Bottles": [[4, null]], "Build the Documentation": [[1, "build-the-documentation"]], "Citation": [[41, null]], "Citing": [[44, "citing"]], "Classic Control": [[5, null]], "Community": [[3, null]], "Creating a custom environment": [[48, null]], "Credits": [[4, "credits"], [6, "credits"], [7, "credits"], [8, "credits"], [9, "credits"], [10, "credits"], [13, "credits"], [14, "credits"], [15, "credits"], [39, "credits"], [40, "credits"]], "Deep-Sea-Treasure": [[6, null]], "Deep-Sea-Treasure-Concave": [[7, null]], "Deep-Sea-Treasure-Mirrored": [[8, null]], "Description": [[4, "description"], [6, "description"], [7, "description"], [8, "description"], [9, "description"], [10, "description"], [11, "description"], [13, "description"], [14, "description"], [15, "description"], 
[17, "description"], [18, "description"], [19, "description"], [20, "description"], [21, "description"], [23, "description"], [24, "description"], [25, "description"], [26, "description"], [27, "description"], [28, "description"], [34, "description"], [35, "description"], [36, "description"], [37, "description"], [39, "description"], [40, "description"]], "Episode Termination": [[4, "episode-termination"], [6, "episode-termination"], [7, "episode-termination"], [8, "episode-termination"], [10, "episode-termination"], [11, "episode-termination"], [13, "episode-termination"], [14, "episode-termination"], [15, "episode-termination"], [35, "episode-termination"], [39, "episode-termination"]], "Fishwood": [[9, null]], "Four-Room": [[10, null]], "Fruit-Tree": [[11, null]], "Grid-World": [[12, null]], "Install": [[44, "install"], [46, null]], "LinearReward": [[50, "linearreward"]], "List of Publications": [[43, null]], "MO-Ant": [[17, null]], "MO-Ant-2D": [[18, null]], "MO-Ant-2Obj": [[19, null]], "MO-Gymnasium 0.3.0 Release: Migrate to Gymnasium": [[47, "release-0-3-0"]], "MO-Gymnasium 0.3.1 Release: Improved documentation and MuJoco MO-Reacher environment": [[47, "release-0-3-1"]], "MO-Gymnasium 0.3.2 Release: Bug fixes, improved webpage": [[47, "release-0-3-2"]], "MO-Gymnasium documentation": [[1, null]], "MO-Halfcheetah": [[20, null]], "MO-Highway": [[21, null]], "MO-Highway-Fast": [[22, null]], "MO-Hopper": [[23, null]], "MO-Hopper-2D": [[24, null]], "MO-Hopper-2Obj": [[25, null]], "MO-Humanoid": [[26, null]], "MO-Lunar-Lander": [[27, null]], "MO-Lunar-Lander-Continuous": [[28, null]], "MO-Mountaincar": [[29, null]], "MO-Mountaincar-3D": [[30, null]], "MO-Mountaincar-Timemove": [[31, null]], "MO-Mountaincar-Timespeed": [[32, null]], "MO-Mountaincarcontinuous": [[33, null]], "MO-Reacher": [[34, null]], "MO-Supermario": [[35, null]], "MO-Swimmer": [[36, null]], "MO-Walker2D": [[37, null]], "MOClipReward": [[50, "moclipreward"]], "MOMaxAndSkipObservation": [[50, 
"momaxandskipobservation"]], "MONormalizeReward": [[50, "monormalizereward"]], "MORL Baselines": [[42, null]], "MORecordEpisodeStatistics": [[49, "morecordepisodestatistics"], [50, "morecordepisodestatistics"]], "MOSyncVectorEnv": [[49, "mosyncvectorenv"]], "Minecart": [[13, null]], "Minecart-Deterministic": [[14, null]], "Minecart-Rgb": [[15, null]], "Miscellaneous": [[16, null]], "MuJoCo": [[38, null]], "Observation Space": [[4, "observation-space"], [6, "observation-space"], [7, "observation-space"], [8, "observation-space"], [9, "observation-space"], [10, "observation-space"], [11, "observation-space"], [13, "observation-space"], [14, "observation-space"], [15, "observation-space"], [34, "observation-space"], [39, "observation-space"], [40, "observation-space"]], "References": [[10, "references"]], "Release Notes": [[47, null]], "Resource-Gathering": [[39, null]], "Reward Space": [[4, "reward-space"], [6, "reward-space"], [7, "reward-space"], [8, "reward-space"], [9, "reward-space"], [10, "reward-space"], [11, "reward-space"], [13, "reward-space"], [14, "reward-space"], [15, "reward-space"], [17, "reward-space"], [18, "reward-space"], [19, "reward-space"], [20, "reward-space"], [21, "reward-space"], [23, "reward-space"], [24, "reward-space"], [25, "reward-space"], [26, "reward-space"], [27, "reward-space"], [28, "reward-space"], [34, "reward-space"], [35, "reward-space"], [36, "reward-space"], [37, "reward-space"], [39, "reward-space"], [40, "reward-space"]], "Reward space:": [[29, "reward-space"], [30, "reward-space"], [31, "reward-space"], [32, "reward-space"], [33, "reward-space"]], "Starting State": [[4, "starting-state"], [6, "starting-state"], [7, "starting-state"], [8, "starting-state"], [9, "starting-state"], [10, "starting-state"], [11, "starting-state"], [13, "starting-state"], [14, "starting-state"], [15, "starting-state"], [39, "starting-state"], [40, "starting-state"]], "Termination": [[9, "termination"]], "The requested page could not be found.": 
[[0, "the-requested-page-could-not-be-found"]], "Vector Wrappers": [[49, null]], "Version History": [[17, "version-history"], [19, "version-history"], [20, "version-history"], [23, "version-history"], [25, "version-history"], [37, "version-history"]], "Version History:": [[26, "version-history"], [34, "version-history"], [36, "version-history"]], "Water-Reservoir": [[40, null]], "Wrappers": [[50, null]], "v0.3.3: MO-Gymnasium 0.3.3 Release: Policy Evaluation bug fix, better documentation page": [[47, "release-v0-3-3"]], "v0.3.4: MO-Gymnasium 0.3.4 Release: Known Pareto Front, improved renders and documentation": [[47, "release-v0-3-4"]], "v1.0.0: MO-Gymnasium becomes mature": [[47, "release-v1-0-0"]], "v1.0.1: MO-Gymnasium 1.0.1 Release: Support Gymnasium 0.29, breakable-bottles pygame render, and more": [[47, "release-v1-0-1"]], "v1.1.0: MO-Gymnasium 1.1.0 Release: New MuJoCo environments, Mirrored Deep Sea Treasure, Fruit Tree rendering, and more": [[47, "release-v1-1-0"]], "v1.2.0: MO-Gymnasium 1.2.0 Release: Update Gymnasium to v1.0.0, New Mountaincar Environments, Documentation and Test Improvements, and more": [[47, "release-v1-2-0"]], "v1.3.0: MO-Gymnasium 1.3.0 Release: New Mujoco v5 Environments": [[47, "release-v1-3-0"]]}, "docnames": ["404", "README", "citing/citing", "community/community", "environments/breakable-bottles", "environments/classical", "environments/deep-sea-treasure", "environments/deep-sea-treasure-concave", "environments/deep-sea-treasure-mirrored", "environments/fishwood", "environments/four-room", "environments/fruit-tree", "environments/grid-world", "environments/minecart", "environments/minecart-deterministic", "environments/minecart-rgb", "environments/misc", "environments/mo-ant", "environments/mo-ant-2d", "environments/mo-ant-2obj", "environments/mo-halfcheetah", "environments/mo-highway", "environments/mo-highway-fast", "environments/mo-hopper", "environments/mo-hopper-2d", "environments/mo-hopper-2obj", 
"environments/mo-humanoid", "environments/mo-lunar-lander", "environments/mo-lunar-lander-continuous", "environments/mo-mountaincar", "environments/mo-mountaincar-3d", "environments/mo-mountaincar-timemove", "environments/mo-mountaincar-timespeed", "environments/mo-mountaincarcontinuous", "environments/mo-reacher", "environments/mo-supermario", "environments/mo-swimmer", "environments/mo-walker2d", "environments/mujoco", "environments/resource-gathering", "environments/water-reservoir", "examples/citation", "examples/morl_baselines", "examples/publications", "index", "introduction/api", "introduction/install", "release_notes", "tutorials/custom_env", "wrappers/vector_wrappers", "wrappers/wrappers"], "envversion": {"sphinx": 62, "sphinx.domains.c": 3, "sphinx.domains.changeset": 1, "sphinx.domains.citation": 1, "sphinx.domains.cpp": 9, "sphinx.domains.index": 1, "sphinx.domains.javascript": 3, "sphinx.domains.math": 2, "sphinx.domains.python": 4, "sphinx.domains.rst": 2, "sphinx.domains.std": 2}, "filenames": ["404.md", "README.md", "citing/citing.md", "community/community.md", "environments/breakable-bottles.md", "environments/classical.md", "environments/deep-sea-treasure.md", "environments/deep-sea-treasure-concave.md", "environments/deep-sea-treasure-mirrored.md", "environments/fishwood.md", "environments/four-room.md", "environments/fruit-tree.md", "environments/grid-world.md", "environments/minecart.md", "environments/minecart-deterministic.md", "environments/minecart-rgb.md", "environments/misc.md", "environments/mo-ant.md", "environments/mo-ant-2d.md", "environments/mo-ant-2obj.md", "environments/mo-halfcheetah.md", "environments/mo-highway.md", "environments/mo-highway-fast.md", "environments/mo-hopper.md", "environments/mo-hopper-2d.md", "environments/mo-hopper-2obj.md", "environments/mo-humanoid.md", "environments/mo-lunar-lander.md", "environments/mo-lunar-lander-continuous.md", "environments/mo-mountaincar.md", "environments/mo-mountaincar-3d.md", 
"environments/mo-mountaincar-timemove.md", "environments/mo-mountaincar-timespeed.md", "environments/mo-mountaincarcontinuous.md", "environments/mo-reacher.md", "environments/mo-supermario.md", "environments/mo-swimmer.md", "environments/mo-walker2d.md", "environments/mujoco.md", "environments/resource-gathering.md", "environments/water-reservoir.md", "examples/citation.md", "examples/morl_baselines.md", "examples/publications.md", "index.md", "introduction/api.md", "introduction/install.md", "release_notes.md", "tutorials/custom_env.md", "wrappers/vector_wrappers.md", "wrappers/wrappers.md"], "indexentries": {"linearreward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.LinearReward", false]], "moclipreward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MOClipReward", false]], "momaxandskipobservation (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MOMaxAndSkipObservation", false]], "monormalizereward (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MONormalizeReward", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers)": [[50, "mo_gymnasium.wrappers.MORecordEpisodeStatistics", false]], "morecordepisodestatistics (class in mo_gymnasium.wrappers.vector)": [[49, "mo_gymnasium.wrappers.vector.MORecordEpisodeStatistics", false]], "mosyncvectorenv (class in mo_gymnasium.wrappers.vector)": [[49, "mo_gymnasium.wrappers.vector.MOSyncVectorEnv", false]]}, "objects": {"mo_gymnasium.wrappers": [[50, 0, 1, "", "LinearReward"], [50, 0, 1, "", "MOClipReward"], [50, 0, 1, "", "MOMaxAndSkipObservation"], [50, 0, 1, "", "MONormalizeReward"], [50, 0, 1, "", "MORecordEpisodeStatistics"]], "mo_gymnasium.wrappers.vector": [[49, 0, 1, "", "MORecordEpisodeStatistics"], [49, 0, 1, "", "MOSyncVectorEnv"]]}, "objnames": {"0": ["py", "class", "Python class"]}, "objtypes": {"0": "py:class"}, "terms": {"": [4, 5, 6, 7, 8, 10, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 36, 37, 44, 45, 
47, 50], "0": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 49, 50], "01": 47, "02": 47, "03": 47, "06": 47, "07": [29, 30, 31, 32, 33], "08": [47, 50], "09": 47, "1": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 49, 50], "10": [6, 7, 8, 11, 12, 27, 28, 39, 40, 47], "100": [27, 28, 35, 47, 49, 50], "101": 47, "103": 47, "105": [17, 19, 47], "106": 47, "107": 47, "108": 47, "109": 47, "11": [6, 7, 23, 24, 25, 47], "1109": 40, "1145": 39, "12": 47, "124": [7, 8], "13": [10, 47], "1390156": 39, "1390162": 39, "14": [10, 47], "16": 47, "160": 40, "17": [20, 26, 37], "18": 47, "19": 47, "1e": [23, 25, 36, 37, 50], "2": [4, 6, 7, 8, 9, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 49], "20": [8, 47], "200": 9, "2008": [12, 39], "2010": 12, "2011": 5, "2012": 40, "2013": 16, "2017": 10, "2018": 12, "2019": [6, 7, 8, 11, 12, 13, 14, 15, 16], "2020": 38, "2021": 12, "2022": [2, 5, 12, 43, 47], "2022bnaic": 2, "2023": [41, 43, 44, 47], "2024": [43, 47], "21": 47, "23": [6, 47], "24": 47, "240": [4, 35], "25": [26, 35, 47], "255": [15, 35], "256": 35, "25th": 39, "26": 47, "27": [18, 47], "28": [27, 28, 47], "2d": [6, 7, 8, 10, 13, 14, 15, 17, 19, 23, 25, 33, 47, 49], "2obj": [17, 23, 47], "3": [4, 6, 7, 8, 10, 13, 14, 15, 17, 18, 19, 21, 22, 23, 24, 25, 27, 28, 29, 30, 31, 32, 34, 35, 37, 39, 40, 49], "30": 47, "31": 47, "33": 47, "34": 47, "348": 26, "34th": 2, "35": 47, "360": 4, "37": 47, "37th": [41, 44], "3d": [5, 13, 14, 15, 29, 31, 32], "4": [4, 6, 7, 8, 10, 13, 14, 15, 26, 27, 28, 34, 35, 36, 39, 40, 49, 50], "40": 47, "41": [39, 47], "42": [47, 49], "43": 47, "45": 47, "46": 47, "47": [39, 47], "480": 15, "5": [4, 11, 12, 13, 14, 15, 21, 22, 27, 28, 35, 39, 47], "50": [4, 47], "51": 47, "52": 47, "53": 47, "55": 47, "56": 47, "57": 
47, "58": 47, "59": 47, "6": [11, 12, 13, 14, 15, 20, 27, 28, 29, 30, 31, 32, 33, 34, 37], "60": 47, "61": 47, "62": 47, "6252759": 40, "63": 11, "64": 47, "65": 47, "67": 47, "69": 47, "7": [6, 11, 12, 13, 14, 15, 47, 49], "70": 47, "72": 47, "73": 47, "74": 47, "75": 47, "76": 47, "77": 47, "79": 47, "8": [17, 18, 19, 27, 28, 36, 40, 44, 45, 47], "80": 47, "81": 47, "83": 47, "84": 47, "85": 47, "86": 47, "87": 47, "89": 47, "9": 34, "90": 47, "91": 47, "92": 47, "93": 47, "94": 47, "95": 47, "97": 47, "99": [47, 50], "A": [2, 4, 10, 16, 17, 18, 19, 22, 23, 25, 29, 30, 31, 32, 33, 40, 41, 43, 44, 45, 50], "As": [4, 44, 45], "At": 49, "But": 50, "By": [29, 30, 31, 32, 40], "For": [1, 34, 44, 45, 47, 49], "If": [3, 13, 14, 15, 17, 18, 19, 23, 24, 25, 40, 41, 44, 48], "In": [4, 47], "It": [42, 44, 45, 47, 48], "Of": 47, "The": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 33, 34, 35, 36, 37, 39, 40, 44, 47, 48, 49], "There": 40, "To": [1, 6, 7, 8, 44, 46], "With": 47, "_": 49, "__init__": 48, "_build": 1, "_episod": 49, "_forward_reward_weight": 47, "_modul": 50, "aama": 43, "abel": [13, 14, 15, 16], "about": [1, 5], "abov": 4, "acceler": [13, 14, 15], "accept": 47, "access": [47, 49], "account": [4, 12], "achiev": 47, "act": [44, 45, 47], "action": [5, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 38, 47, 48, 49], "action_spac": [48, 49], "acttyp": 50, "ad": [17, 18, 19, 23, 24, 25, 47, 48, 49], "adapt": [6, 7, 8, 10], "add": [29, 30, 31, 32, 43, 47], "add_speed_object": [29, 30, 31, 32], "addit": 5, "addition": 47, "after": [9, 47, 50], "again": 4, "agent": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 39, 40, 47], "ai": 4, "al": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 38, 43], "alegr": [2, 12, 41, 43, 44], "algorithm": [42, 44], "align": 43, "all": [3, 17, 18, 19, 39, 44, 46, 47, 49, 50], "allow": 47, "also": [3, 16, 44, 45, 47], "altern": [29, 30, 31, 32], "alwai": [6, 7, 
8], "amount": [16, 40], "amp": 47, "an": [5, 10, 29, 30, 31, 32, 35, 39, 40, 44, 45, 47, 48, 50], "ana": [2, 41, 44], "andrea": 47, "andr\u00e9": 10, "angl": 34, "angular": 34, "ani": 49, "ann": [2, 41, 44], "ansi": 40, "ansimuz": [6, 7, 8], "ant": [38, 47], "antenv": [17, 18, 19], "api": [42, 47, 48], "appear": 2, "appli": [4, 34, 49], "approach": 4, "approxim": 43, "ar": [3, 4, 13, 14, 15, 16, 39, 40, 47, 48, 49, 50], "arm": 34, "arrai": [10, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 48, 49, 50], "art": [4, 6, 7, 8, 47], "artifici": 2, "asid": 3, "ask": 3, "asset": [4, 39, 47], "assist": [4, 6, 7, 8], "associ": 47, "atari_wrapp": 50, "attribut": 48, "australia": 40, "author": [2, 41, 44], "autobuild": 1, "automat": [1, 47, 48], "avail": [47, 49, 50], "averag": 50, "avoid": [10, 16], "axel": [13, 14, 15], "axelabel": 3, "axi": [23, 24, 25], "b": 1, "back": 47, "background": [6, 7, 8, 40], "backward": 5, "balanc": 47, "barret": 12, "barreto": 10, "barrett": 39, "base": [3, 4, 13, 14, 15, 34, 38, 40, 43, 47, 50], "baselin": 47, "baselines3": 50, "batteri": 47, "bazzan": [2, 41, 44], "becaus": 4, "been": [4, 5, 47], "befor": 49, "begin": [49, 50], "behind": 5, "benchmark": [41, 43, 44], "benefit": 47, "benelearn": 2, "benelux": 2, "between": [35, 40, 44, 47, 50], "bib": 47, "binari": [10, 11, 12], "blob": [13, 14, 15], "blue": 10, "bnaic": [2, 43], "bnj6kubtg6": 44, "booktitl": [2, 41, 44], "bool": 49, "boolean": [4, 49], "both": 50, "both_norm_env": 50, "bottl": 12, "bottle_reward": 4, "bottles_carri": 4, "bottles_deliv": [4, 12], "bottles_drop": 4, "bound": [40, 47], "box": [6, 7, 8, 17, 18, 19, 20, 23, 24, 25, 26, 28, 33, 36, 37, 40], "brake": [13, 14, 15], "break": 47, "breakabl": 12, "breakablebottl": 4, "brisban": 40, "bro": 35, "bruno": [2, 41, 44], "budget": 43, "buffer": 49, "buffer_length": [49, 50], "bugfix": 47, "bump": 47, "button": 47, "c": [2, 41, 44], "cai": 43, "calcul": 4, "call": 47, "callabl": 49, "can": [3, 4, 9, 11, 13, 14, 15, 17, 19, 
23, 25, 29, 30, 31, 32, 40, 44, 45, 46, 47, 49, 50], "cannot": 4, "capabl": 47, "capac": [13, 14, 15], "car": [5, 29, 30, 31, 32, 47], "carb": [11, 12], "care": 49, "carri": 4, "cart": [13, 14, 15], "castelletti": 40, "catch": 9, "caus": 47, "cc": 47, "cd": 1, "cell": 12, "central": 34, "certain": [44, 46], "chanc": 12, "chang": [1, 6, 7, 8, 20, 26, 29, 30, 31, 32, 47], "changelog": 47, "check": [44, 45, 47], "chose": 11, "ci": 47, "circl": 10, "citat": 47, "cite": 41, "class": [5, 44, 45, 49, 50], "classic": [6, 7, 8, 48], "clip": 50, "close": 48, "co": [13, 14, 15, 34], "code": [3, 6, 7, 8, 9, 10, 13, 14, 15, 40, 47, 50], "coin": [16, 35], "colab": [44, 45], "collect": [9, 10, 11, 12, 13, 14, 15, 16, 35, 39, 47], "collis": [16, 21], "com": [3, 13, 14, 15], "combin": 47, "commit": 47, "common": 50, "commun": [44, 47], "compar": 44, "complet": 50, "compliant": 44, "compon": [10, 47, 50], "compromis": 47, "comput": [34, 47, 48], "concav": [12, 47], "concave_map": [6, 7, 8], "conduct": 47, "confer": [2, 39, 40, 41, 44], "config": [13, 14, 15], "configur": [13, 14, 15], "conflict": 47, "conor": 3, "consequ": 47, "consist": 39, "constructor": 48, "consum": [13, 14, 15], "consumpt": [5, 13, 14, 15, 16], "contact": [17, 19, 26], "contain": [1, 4, 10, 11, 12, 13, 14, 15, 29, 30, 31, 32, 33, 34, 42], "content": 40, "context": 47, "continu": [5, 6, 7, 8, 16, 33, 38, 40, 47], "contribut": [1, 3, 4, 47], "contributor": [3, 47], "control": [6, 7, 8, 9, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "control_cost": 47, "converg": 5, "convers": 47, "convex": [6, 7, 8], "coordin": [6, 7, 8, 39, 44], "copi": 49, "corner": [13, 14, 15], "correct": 47, "correspond": [16, 29, 30, 31, 32, 40], "cost": [17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 36, 37, 40], "cost_flood": 16, "cost_object": [17, 18, 19, 23, 24, 25], "crash": [27, 28], "creat": [4, 6, 7, 8, 44, 45, 47], "creation": 47, "criteria": 39, "ctrl_cost": 47, "cumul": [49, 50], "current": [4, 6, 7, 8, 40], "custom": 47, "d": [11, 12, 
43], "da": [2, 41, 44], "dall": [4, 6, 7, 8], "dam": [16, 40], "danoi": [2, 41, 44], "deal": 48, "death": 16, "decis": 40, "decomposit": 43, "deep": [3, 12, 49, 50], "deep_sea_treasur": 47, "deepseatreasur": [6, 7, 8], "default": [6, 7, 8, 13, 14, 15, 29, 30, 31, 32, 40], "deficit": 40, "deficit_wat": 16, "defin": [4, 5, 16, 34, 48], "definit": [44, 45], "deliv": [4, 12], "demand": 40, "deni": [3, 9], "dens": [13, 14, 15], "dep": 47, "depend": [44, 46], "deprec": 47, "depth": [11, 12], "deque_s": 49, "descript": [5, 12, 16, 38], "design": [47, 49], "desir": 47, "destin": 12, "detail": [5, 44, 45], "determin": 47, "determinist": 47, "develop": 44, "deviat": 50, "di": 35, "diamond": 39, "dict": 4, "dictionari": [4, 12], "did": 4, "differ": [4, 12, 47], "dim_reward": 49, "dimens": [4, 47], "dimension": [6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 39], "directli": [47, 49, 50], "directori": 48, "dirhtml": 1, "disc_episode_return": 47, "discord": [3, 44], "discount": [48, 49, 50], "discret": [4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 21, 22, 27, 29, 30, 31, 32, 34, 35, 38, 39, 47], "dissert": 5, "distanc": [34, 48], "distinct": 47, "distribut": 43, "do": 47, "doc": [1, 47], "document": [44, 48], "doe": [44, 46, 50], "doi": 40, "domain": 47, "done": [48, 49], "dot": 50, "down": [6, 7, 8, 10, 39], "downstream": 40, "dr": [49, 50], "drop": [4, 47], "dst": [12, 47], "dst_map": [6, 7, 8], "dtype": [47, 49], "due": [5, 40], "dynmorl": 3, "e": [1, 2, 4, 6, 7, 8, 12, 33, 41, 44, 47], "each": [4, 6, 7, 8, 11, 13, 14, 15, 29, 30, 31, 32, 33, 34, 47, 49], "eat": 12, "edit": 47, "effici": 43, "either": 9, "el": [2, 41, 44], "elaps": [49, 50], "elbow": 34, "element": [39, 47], "els": [10, 35, 39], "en": 50, "enabl": 47, "end": [9, 13, 14, 15, 49], "enemi": [4, 12, 16, 35, 39], "energi": 38, "engin": [27, 28], "entri": 43, "entry_point": 48, "env": [3, 5, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 
32, 36, 37, 38, 44, 45, 47, 48, 49, 50], "env_fn": 49, "environ": [2, 4, 5, 6, 7, 8, 9, 10, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 40, 43, 44, 45, 46, 49], "episod": [9, 40, 49, 50], "epsilon": 50, "equival": 5, "error": 47, "esr": [12, 47], "essenti": [44, 48], "et": [5, 6, 7, 8, 10, 11, 12, 13, 14, 15, 16, 38, 43], "eval_mo": 47, "everi": [1, 11, 12, 50], "exampl": [10, 42, 44, 45, 47, 49, 50], "except": 50, "excess": 40, "execut": [16, 40], "exhaust": 47, "expand": 47, "expect": 9, "extend": 47, "extra": [5, 29, 30, 31, 32], "extract": 50, "ezpickl": 47, "f": [3, 40], "fair": 43, "fall": 47, "fals": [17, 18, 19, 23, 24, 25, 49], "famili": [44, 46], "fan": 43, "fantasi": [6, 7, 8], "far": 35, "farama": [3, 13, 14, 15, 17, 19, 20, 23, 25, 26, 34, 36, 37, 44, 47], "fast": [16, 47], "fat": [11, 12], "featur": [3, 10, 47], "feder": 43, "felten": [2, 12, 41, 43, 44], "felten_toolkit_2023": [41, 44], "few": [47, 49, 50], "ffelten": 47, "file": [13, 14, 15, 47, 48], "fill": [13, 14, 15], "finger_tip_coord": 34, "fire": 12, "first": [2, 13, 14, 15, 40, 43, 47, 49], "fish": [9, 12], "fish_amount": 12, "fisherman": 9, "fishproba": 9, "fishwood": [3, 12, 47], "fit": 40, "fix": 10, "flag": [4, 17, 18, 19, 23, 24, 25, 35, 39, 48], "flexibl": 47, "float": [40, 48, 49, 50], "float32": [17, 18, 19, 20, 23, 24, 25, 26, 28, 33, 36, 37, 40, 49], "float_stat": [6, 7, 8], "flood": 40, "florian": [2, 41, 44], "folder": [1, 47], "follow": [2, 10, 13, 14, 15, 17, 18, 19, 20, 23, 24, 25, 26, 29, 30, 31, 32, 36, 37, 44, 45, 47, 48], "forc": [17, 19, 26], "forgotten": 47, "fork": 1, "form": 49, "formerli": [2, 43], "forward": [5, 20, 23, 24, 25, 26, 29, 30, 31, 32, 36, 37], "forward_penalti": 5, "forward_reward": 47, "found": 47, "foundat": [13, 14, 15, 47], "four": [3, 12, 34], "frame": 50, "frame_skip": [13, 14, 15], "frameskip": 50, "framework": 43, "from": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 20, 26, 39, 
40, 47, 48, 49, 50], "front": 48, "fruit": [3, 12], "fruit_tre": 47, "fuel": [5, 13, 14, 15, 16, 27, 28, 33], "fuel_consumption_penalti": 5, "full": [11, 12, 47], "function": [44, 45, 47], "g": [10, 12, 47], "gamma": [48, 49, 50], "gather": [12, 47], "gem": [4, 12, 39], "gener": [43, 47, 48], "get": 47, "gg": 44, "ghazali": [2, 41, 44], "gif": 47, "gimelfarb": [3, 10], "github": [3, 13, 14, 15, 47], "give": 5, "given": 50, "go": [1, 9, 11, 23, 24, 25, 29, 30, 31, 32], "goal": [10, 12, 29, 30, 31, 32, 33], "goe": 48, "goir": [2, 41, 44], "gold": [4, 12, 39], "gr": [2, 41, 44], "green": 10, "grid": [6, 7, 8], "gridworld": [10, 12], "ground": 4, "group": 47, "gt": 47, "guarante": 43, "guid": [44, 45], "gupta": 5, "gym": [2, 35, 43, 44, 45, 47], "gymnasium": [2, 5, 13, 14, 15, 16, 17, 18, 19, 20, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 36, 37, 42, 43, 44, 45, 46, 48, 49, 50], "ha": [4, 5, 17, 19, 20, 23, 25, 26, 35, 47, 49], "half_cheetah": 20, "halfcheetah": [38, 47], "halfcheetahenv": 20, "harder": 12, "hartmann": 43, "have": [3, 4, 5, 12, 44, 47, 50], "hay": 3, "healthi": [17, 18, 19], "heavili": 50, "height": 38, "help": 3, "here": [3, 10, 44, 45, 47], "high": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 47], "higher": 47, "highwai": [16, 47], "highwayenv": 21, "highwayfastenv": 22, "home": [4, 39], "hopper": [38, 47], "hopperenv": [23, 24, 25], "hotfix": 47, "how": [1, 13, 14, 15, 35, 42, 47], "html": 50, "http": [3, 4, 6, 7, 8, 13, 14, 15, 17, 19, 20, 23, 25, 26, 34, 36, 37, 39, 40, 44, 50], "human": [13, 14, 15, 40], "humanoid": [38, 47], "humanoidenv": 26, "humonoid": 38, "hung": 5, "hydroelectr": 40, "hyperparamet": 43, "i": [1, 3, 4, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 42, 44, 45, 47, 48, 49, 50], "ianleongudri": 47, "id": [17, 19, 23, 25, 48], "idx": 50, "igd": 48, "ijcnn": 40, 
"illustr": 47, "imag": [13, 14, 15, 16, 40], "image_observ": [13, 14, 15], "impact": 4, "implement": [4, 42, 48], "import": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "improv": 43, "includ": [16, 17, 19, 26, 44, 46], "inconsist": 47, "increment": [13, 14, 15], "incremental_frame_skip": [13, 14, 15], "index": [49, 50], "indic": [4, 10, 39, 47, 49], "inf": [4, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 40], "info": [44, 45, 47, 48, 49, 50], "info_dict": 47, "inform": [1, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 41, 44], "inher": 47, "inherit": 48, "init": 47, "initi": [40, 48], "initial_st": 40, "inproceed": [2, 41, 44], "inspir": 50, "instal": 1, "instanc": [44, 45, 47], "instanti": [17, 19, 23, 25], "instead": [4, 17, 19, 23, 25, 47], "int": [49, 50], "int32": 49, "integ": 48, "integr": 47, "intellig": 2, "interact": [44, 45], "intern": [39, 40], "introduc": [5, 10, 47], "invert": 48, "io": [4, 6, 7, 8, 39, 50], "issu": 47, "itch": [4, 6, 7, 8, 39], "item": [10, 12], "item1": 12, "item2": 12, "item3": 12, "iter": [40, 49], "its": 48, "ivanov": 43, "j": 47, "johnson": 47, "join": [3, 44], "joint": [34, 40], "json": [13, 14, 15], "jump": [23, 24, 25], "kallinteri": 47, "katze2664": 47, "keep": [49, 50], "kei": [4, 49], "kill": [12, 35, 39], "klassert": 4, "known": 48, "kwarg": 48, "l": [2, 41, 44, 49, 50], "lack": 5, "lambda": 49, "land": [5, 27, 28], "lander": [5, 47], "lane": [16, 21], "larger": 4, "last": [49, 50], "leaf": [11, 12], "learn": [2, 4, 9, 10, 39, 41, 43, 44, 45, 47], "left": [4, 6, 7, 8, 10, 11, 13, 14, 15, 39], "length": [49, 50], "length_queu": 49, "leon": 39, "level": [40, 47], "leverag": 43, "librari": [2, 43, 44, 47], "life": 47, "light": 12, "like": [3, 44, 46, 50], "limezu": [4, 39], "limit": 16, "line": 48, "linear": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37], 
"linearli": 47, "linearreward": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "linearwrapp": 47, "link": 47, "lint": 47, "list": [4, 47], "literatur": 47, "local": 5, "locat": [4, 12, 34], "logo": 47, "look": 50, "low": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "lower": 10, "luca": [2, 41, 44], "lucasalegr": 47, "lunar": [5, 47], "lunarland": [5, 27, 28], "m": 40, "machin": 39, "made": [1, 47], "mai": 47, "main": [3, 13, 14, 15, 27, 28, 36, 37], "main_engine_fuel": 5, "make": [1, 4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "mani": [13, 14, 15, 49], "map": [6, 7, 8, 10, 12, 13, 14, 15, 47], "mario": [35, 47], "mark": 47, "markov": 40, "master": 50, "match": 47, "mathieu": [3, 40], "max": 50, "max_r": 50, "max_t": 9, "maxandskipenv": 50, "maxima": 5, "maximum": 40, "maze": 10, "md": [1, 47], "mdp": [44, 45, 47], "mean": 50, "merg": [5, 29, 30, 31, 32], "merge_move_penalti": [29, 30, 31, 32], "method": [47, 48], "metric": 48, "mgoulao": 47, "mike": [3, 10], "min": 50, "min_r": 50, "mine": [13, 14, 15], "mine_config": [13, 14, 15], "minecart": [3, 16, 44, 45, 47], "miner": [11, 12], "minerium": [13, 14, 15], "minim": [13, 14, 15, 16], "minor": 47, "mirror": 12, "mirrored_map": [6, 7, 8], "miss": [43, 47], "mistak": 47, "mo": [2, 3, 5, 13, 14, 15, 16, 38, 42, 43, 44, 45, 46, 48, 49, 50], "mo_gym": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 49, 50], "mo_gymnasium": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 44, 45, 47, 48, 49, 50], "mode": [13, 14, 15, 40], "model": [43, 44, 45], "modem": 43, "modifi": 47, "modul": [49, 50], "mofl": 43, "momaxandskipobserv": 47, "momdp": [44, 45, 47], "monormalizereward": 47, "more": [1, 5, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 
29, 30, 31, 32, 33, 35, 36, 37, 44, 45], "morecordepisodestatist": 47, "moreov": [48, 49], "morewordstatist": 49, "morl": [3, 6, 7, 8, 9, 44, 45, 47], "most": 49, "mountain": [5, 29, 30, 31, 32, 33, 47], "mountaincar": [5, 33], "mountaincarcontinu": [5, 47], "move": [4, 5, 35, 36, 39, 47, 50], "move_penalti": 5, "much": 35, "mujoco": [17, 19, 20, 23, 25, 26, 34, 36, 37, 44, 46], "multi": [2, 5, 9, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 40, 41, 43, 44, 45, 47, 48], "multibinari": 4, "multiobject": 4, "multipl": [4, 39, 42, 43, 47, 48, 49], "must": [12, 13, 14, 15, 16, 48], "my_env_dir": 48, "my_env_fil": 48, "my_env_v0": 48, "myenv": 48, "mypi": 47, "n": [2, 41, 44], "nO": 40, "narayanan": [12, 39], "ndarrai": 50, "need": 47, "neg": [10, 33, 34], "neighbour": 16, "network": 40, "neural": [40, 41, 44], "neurip": [41, 43, 44], "next": 48, "next_ob": [44, 45, 47], "ninjikin": [4, 39], "nip": 10, "node": 11, "none": [13, 14, 15, 40, 47, 50], "norm": 33, "norm_treasure_env": 50, "normal": [40, 47, 49, 50], "normalized_act": 40, "note": [4, 50], "notebook": [44, 45], "now": [2, 17, 19, 23, 25, 26, 41, 44, 47], "np": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "num": 49, "num_env": 49, "number": [4, 40], "numpi": [44, 45, 47, 48], "nutri1": 12, "nutri6": 12, "nutrient": [11, 12], "ob": [5, 12, 16, 38, 44, 45, 47, 49], "object": [2, 5, 9, 12, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 34, 35, 36, 37, 38, 40, 41, 43, 44, 45, 47, 48], "observ": [12, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 35, 36, 37, 47, 48, 50], "observation_spac": 48, "observationspac": 47, "obstyp": 50, "off": 47, "oject": 48, "onc": 1, "one": [44, 46, 47, 50], "onli": [40, 50], "open": [43, 44], "opengameart": 40, "optim": [39, 43, 47], "option": [29, 30, 31, 32, 44, 45, 47, 48], "order": 47, "ore1": 16, "ore2": 16, "ores": [13, 14, 15, 16], "org": [17, 19, 20, 23, 25, 26, 34, 36, 37, 40, 44], 
"orient": [13, 14, 15], "origin": [4, 17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47], "other": [16, 17, 18, 19, 20, 23, 24, 25, 44, 45, 47, 50], "otherwis": [4, 9, 35], "our": [1, 47, 48], "out": [3, 40], "outcom": 4, "output": 49, "packag": [1, 47], "paper": 4, "pareto": [43, 48], "pareto_front": [47, 48], "parisi": 40, "part": [47, 48], "pass": [35, 47], "passag": 10, "path": [13, 14, 15], "paulina": 40, "penal": 40, "penalti": [4, 5, 6, 7, 8, 12, 29, 30, 31, 32, 33, 35], "peopl": 3, "percentag": 40, "perform": [47, 48], "person": 43, "pf": 47, "pianosi": [16, 40], "pick": 4, "pip": [1, 44, 46], "pixel": [4, 6, 7, 8, 47], "plan": [44, 45], "pleas": [41, 43, 44], "plu": 10, "point": 35, "polici": [39, 43], "porcentag": [13, 14, 15], "port": 40, "posit": [5, 6, 7, 8, 10, 13, 14, 15, 34, 35, 39], "possibl": [4, 34], "potenti": [4, 12, 47], "pp": 40, "practic": [44, 45], "pranav": 5, "pranavg23": 47, "pre": 47, "predefin": 47, "prefer": 47, "prevent": 5, "previous": 47, "priorit": 43, "prob_drop": 4, "probabl": [4, 9], "problem": [4, 6, 7, 8, 9, 40, 47], "problemat": [44, 46], "proceed": [2, 39, 41, 44], "process": [41, 44], "product": 50, "project": 3, "protein": [11, 12], "provid": [3, 9, 44, 47, 49], "pseudo": 47, "public": [2, 44], "publish": 43, "pull": [43, 48], "py": [47, 48], "pydoc": 47, "pymoo": 47, "pypi": 47, "pytest": 48, "python": [44, 45, 47], "q": 40, "qld": 40, "qualiti": 47, "quantiti": [13, 14, 15], "question": 3, "r": [1, 49, 50], "r_i": 34, "randint": 47, "random": 40, "rang": [47, 49], "rather": 4, "reach": [3, 6, 7, 8, 10, 11, 12, 16, 29, 30, 31, 32, 33, 35, 47], "reacher": 38, "read": 5, "readm": 47, "readthedoc": 50, "reason": 5, "rebuild": 1, "receiv": [11, 47], "recent": 49, "recov": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37], "red": 10, "refactor": [3, 13, 14, 15], "refer": 48, "registr": 48, "registri": 48, "reinforc": [2, 4, 9, 10, 41, 43, 44, 45, 47], "reinject": 50, "relax": [2, 41, 44], "releas": [16, 40], "reli": 47, "reliabl": 
[41, 43, 44], "remov": [29, 30, 31, 32, 47], "remove_move_penalti": [29, 30, 31, 32], "renam": 47, "render": [13, 14, 15, 40, 48], "render_mod": [13, 14, 15, 40], "repeat": [13, 14, 15], "repositori": [41, 42, 44, 48], "repres": 47, "request": 43, "requir": 1, "research": [41, 43, 44], "reservoir": [3, 16, 47], "reset": [44, 45, 47, 48, 49, 50], "resourc": [12, 47], "respect": 49, "restelli": 40, "retriev": [13, 14, 15], "return": [9, 13, 14, 15, 39, 44, 47, 48, 50], "return_queu": 49, "revamp": 47, "revers": [4, 5, 29, 30, 31, 32], "reverse_penalti": 5, "reward": [5, 22, 44, 45, 47, 48, 49, 50], "reward_dim": 48, "reward_spac": [47, 48], "reymond": [3, 40], "rgb": [13, 14], "rgb_arrai": [13, 14, 15, 40], "right": [4, 6, 7, 8, 10, 11, 13, 14, 15, 21, 39], "right_lan": 16, "rightest": 16, "riva": 40, "rl": 47, "rnd": 47, "robert": 4, "rodriguez": 43, "roijer": 12, "room": [3, 12], "root": [11, 47], "run": [20, 26, 37, 48, 49], "runzheyang": 3, "safeti": 4, "same": [6, 7, 8], "sampl": [43, 49], "save": 47, "scalar": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 50], "scale": [20, 26], "scenario": 47, "scott": 47, "sea": [3, 12, 49, 50], "sebimarkgraf": 47, "second": [13, 14, 15], "section": 4, "see": [10, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 44, 45, 47, 48], "seed": [48, 49], "select": 40, "self": [47, 48], "sens": 50, "separ": [10, 17, 19, 23, 25], "serenevillagerevamp": [4, 39], "serial": 49, "server": [3, 44], "set": [17, 18, 19, 23, 24, 25, 44, 47, 48], "setup": 47, "shape": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40, 48, 49], "shaped_reward": 5, "should": [47, 48], "shown": 47, "side": [27, 28], "side_engine_fuel": 5, "signal": 5, "silva": [2, 41, 44], "similar": [38, 47, 49], "similarli": [5, 16], "simon": 40, "simpl": [9, 44, 45], "simpli": 3, "sin": [13, 14, 15, 34], "sinc": [48, 49, 50], "singl": [29, 30, 31, 32, 
47], "size": [4, 11, 48], "skip": 50, "sky": 40, "small": [4, 47], "smooth": 50, "snippet": 47, "so": 4, "some": [3, 44, 46, 48], "soto": 43, "sourc": [6, 7, 8, 10, 12, 13, 14, 15, 33, 44], "space": [5, 12, 16, 22, 38, 47, 48], "spars": [13, 14, 15], "specif": 49, "specifi": 4, "speed": [5, 13, 14, 15, 16, 21, 29, 30, 31, 32, 47], "speed_object": 5, "spell": 47, "sphinx": 1, "split": 10, "squar": 10, "srini": 39, "stabil": 50, "stabl": [47, 50], "stable_baselines3": 50, "stai": 16, "standard": [44, 47, 50], "static": 5, "statist": 49, "stats_kei": [49, 50], "steckelmach": [3, 9], "step": [4, 5, 6, 7, 8, 9, 29, 30, 31, 32, 33, 35, 40, 43, 44, 45, 47, 48, 49], "store": 49, "str": [49, 50], "structur": 47, "sub": 49, "submarin": [6, 7, 8, 12], "submiss": 43, "subpackag": 47, "successfulli": [27, 28], "successor": [3, 10], "suit": 44, "super": 35, "supermario": [3, 16], "supermariobro": 35, "supermariobrosenv": 16, "suppli": 40, "support": 16, "swimmer": [38, 47], "swimmerenv": 36, "system": [41, 44, 46], "t": [49, 50], "tailor": 47, "take": [4, 12], "taken": 12, "talbi": [2, 41, 44], "target": 34, "target_1": 38, "target_2": 38, "target_3": 38, "target_4": 38, "target_i": 34, "taxonomi": 43, "termin": [44, 45, 47, 48, 49], "th": 50, "than": 4, "thank": 3, "thei": [47, 49, 50], "them": [3, 4, 5, 44, 45], "therefor": 11, "thi": [1, 4, 41, 44, 45, 46, 47, 48, 49, 50], "those": 10, "thought": 47, "three": [12, 47], "threshold": 40, "thrill": 47, "through": 48, "thu": 47, "ti": 48, "time": [1, 4, 5, 6, 7, 8, 12, 13, 14, 15, 16, 29, 30, 31, 32, 33, 35, 49, 50], "time_limit": 40, "time_penalti": [4, 5, 12], "timemov": 5, "timespe": 5, "timondesch": 47, "tip": 34, "titl": [2, 41, 44], "tomekst": 47, "tool": 47, "toolkit": [41, 43, 44], "top": [29, 30, 31, 32, 33], "torqu": 34, "touch": 50, "track": [49, 50], "trade": 47, "train": 50, "transfer": [3, 10], "transform": 47, "travel": 10, "treasur": [3, 4, 12, 39, 49, 50], "tree": [3, 12, 40], "triangl": 10, "true": [4, 6, 7, 8, 
13, 14, 15, 40, 49], "truncat": [40, 44, 45, 47, 48, 49], "tuto": 47, "tutori": 48, "two": [9, 13, 14, 15, 16, 34, 35, 40, 50], "txt": 1, "type": [12, 13, 14, 15, 16, 47], "u": 3, "unbreakable_bottl": 4, "unbreakablebottl": 4, "under": [42, 47], "underwat": [6, 7, 8], "unpin": 47, "until": 40, "unwrap": 47, "up": [4, 6, 7, 8, 10, 39, 40], "upper": [13, 14, 15], "upstream": 40, "us": [6, 7, 8, 13, 14, 15, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50], "usag": 47, "user": 47, "util": [9, 47], "v0": [3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 21, 22, 29, 30, 31, 32, 33, 35, 38, 39, 40, 44, 45, 49, 50], "v2": [5, 47], "v3": [27, 28, 47], "v4": [17, 18, 19, 20, 23, 24, 25, 26, 34, 38, 47], "v5": [17, 19, 20, 23, 25, 26, 34, 36, 37], "valu": [4, 6, 7, 8, 11, 12, 43], "vamplew": [5, 12], "variabl": 49, "variou": [3, 42], "vecenv": 47, "vector": [10, 11, 13, 14, 15, 29, 30, 31, 32, 33, 35, 44, 47, 48, 50], "vector_reward": [44, 45, 47], "vectorenv": 49, "vectori": 47, "vehicl": 16, "veloc": [17, 18, 19, 26, 34, 36, 37, 38], "veri": [44, 45, 48], "version": [5, 10, 12, 16, 18, 21, 22, 24, 27, 28, 29, 30, 31, 32, 33, 35, 38, 47], "via": [17, 19, 23, 25, 43, 49], "vitamin": [11, 12], "wa": [3, 4, 5, 6, 7, 8, 13, 14, 15, 43, 47], "wai": [3, 10], "walker2d": [38, 47], "walker2denv": 37, "wall": 10, "want": 3, "warn": [16, 47], "water": [3, 11, 12, 16, 47], "we": [3, 44, 47, 48], "websit": [44, 47], "weight": [17, 18, 19, 20, 23, 24, 25, 26, 36, 37, 44, 45, 47, 50], "welfar": 43, "well": [44, 47, 48], "were": 10, "what": 47, "when": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 35, 39, 47, 48], "where": [6, 7, 8, 9, 11, 29, 30, 31, 32, 33, 47], "whether": [13, 14, 15, 40], "which": [4, 5, 6, 7, 8, 9, 10, 44, 47, 48, 49, 50], "while": [4, 10, 12, 16], "within": [47, 48, 49], "without": [17, 19, 23, 25], "wood": [9, 12], "wood_amount": 12, "woodproba": 9, "work": [44, 49], "worker": 47, "workshop": [2, 43], "world": [6, 7, 8], "would": 3, "wrap": [47, 49], "wrapped_env": 49, "wrapper": 
[42, 44, 45, 47], "wrt": 40, "x": [6, 7, 8, 17, 18, 19, 23, 24, 25, 26, 35, 36, 37, 39], "x_po": 16, "x_veloc": [38, 47], "xu": 38, "y": [6, 7, 8, 17, 18, 19, 39], "y_veloc": 38, "yang": [6, 7, 8, 11, 12, 16], "year": [2, 41, 44], "you": [3, 41, 44, 45, 46, 47, 48], "your": [1, 41, 44], "your_ag": [44, 45, 47], "z": [23, 24, 25], "zero": [34, 47]}, "titles": ["404 - Page Not Found", "MO-Gymnasium documentation", "<no title>", "Community", "Breakable-Bottles", "Classic Control", "Deep-Sea-Treasure", "Deep-Sea-Treasure-Concave", "Deep-Sea-Treasure-Mirrored", "Fishwood", "Four-Room", "Fruit-Tree", "Grid-World", "Minecart", "Minecart-Deterministic", "Minecart-Rgb", "Miscellaneous", "MO-Ant", "MO-Ant-2D", "MO-Ant-2Obj", "MO-Halfcheetah", "MO-Highway", "MO-Highway-Fast", "MO-Hopper", "MO-Hopper-2D", "MO-Hopper-2Obj", "MO-Humanoid", "MO-Lunar-Lander", "MO-Lunar-Lander-Continuous", "MO-Mountaincar", "MO-Mountaincar-3D", "MO-Mountaincar-Timemove", "MO-Mountaincar-Timespeed", "MO-Mountaincarcontinuous", "MO-Reacher", "MO-Supermario", "MO-Swimmer", "MO-Walker2D", "MuJoCo", "Resource-Gathering", "Water-Reservoir", "Citation", "MORL Baselines", "List of Publications", "API", "API", "Install", "Release Notes", "Creating a custom environment", "Vector Wrappers", "Wrappers"], "titleterms": {"0": 47, "1": [47, 48], "2": [47, 48], "29": 47, "2d": [18, 24], "2obj": [19, 25], "3": [47, 48], "3d": 30, "4": [47, 48], "404": 0, "Not": 0, "The": 0, "acknowledg": 3, "action": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 34, 39, 40], "ant": [17, 18, 19], "api": [44, 45], "argument": [4, 6, 7, 8, 9, 10, 13, 14, 15, 40], "baselin": 42, "becom": 47, "better": 47, "bottl": [4, 47], "breakabl": [4, 47], "bug": 47, "build": 1, "citat": 41, "cite": 44, "class": 48, "classic": 5, "commun": 3, "concav": 7, "continu": 28, "control": 5, "could": 0, "creat": 48, "credit": [4, 6, 7, 8, 9, 10, 13, 14, 15, 39, 40], "custom": 48, "deep": [6, 7, 8, 47], "descript": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 
21, 23, 24, 25, 26, 27, 28, 34, 35, 36, 37, 39, 40], "determinist": 14, "document": [1, 47], "environ": [47, 48], "episod": [4, 6, 7, 8, 10, 11, 13, 14, 15, 35, 39], "evalu": 47, "fast": 22, "fishwood": 9, "fix": 47, "found": 0, "four": 10, "front": 47, "fruit": [11, 47], "gather": 39, "grid": 12, "gymnasium": [1, 47], "halfcheetah": 20, "highwai": [21, 22], "histori": [17, 19, 20, 23, 25, 26, 34, 36, 37], "hopper": [23, 24, 25], "humanoid": 26, "improv": 47, "instal": [44, 46], "instanti": 48, "known": 47, "lander": [27, 28], "linearreward": 50, "list": 43, "lunar": [27, 28], "matur": 47, "migrat": 47, "minecart": [13, 14, 15], "mirror": [8, 47], "miscellan": 16, "mo": [1, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 47], "moclipreward": 50, "momaxandskipobserv": 50, "monormalizereward": 50, "more": 47, "morecordepisodestatist": [49, 50], "morl": 42, "mosyncvectorenv": 49, "mountaincar": [29, 30, 31, 32, 47], "mountaincarcontinu": 33, "mujoco": [38, 47], "new": [47, 48], "note": 47, "observ": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 34, 39, 40], "page": [0, 47], "pareto": 47, "polici": 47, "public": 43, "pygam": 47, "reacher": [34, 47], "refer": 10, "regist": 48, "releas": 47, "render": 47, "request": 0, "reservoir": 40, "resourc": 39, "reward": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "rgb": 15, "room": 10, "sea": [6, 7, 8, 47], "space": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 17, 18, 19, 20, 21, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 39, 40], "start": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 39, 40], "state": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 39, 40], "supermario": 35, "support": 47, "swimmer": 36, "termin": [4, 6, 7, 8, 9, 10, 11, 13, 14, 15, 35, 39], "test": [47, 48], "timemov": 31, "timespe": 32, "treasur": [6, 7, 8, 47], "tree": [11, 47], "updat": 47, "v0": 47, "v1": 47, "v5": 47, "vector": 49, "version": [17, 19, 20, 23, 25, 
26, 34, 36, 37], "walker2d": 37, "water": 40, "webpag": 47, "world": 12, "wrapper": [49, 50], "your": 48}}) \ No newline at end of file diff --git a/tutorials/custom_env/index.html b/tutorials/custom_env/index.html index 5e0ae12..6f16774 100644 --- a/tutorials/custom_env/index.html +++ b/tutorials/custom_env/index.html @@ -252,6 +252,7 @@
      • MO-Hopper
      • MO-Halfcheetah
      • MO-Walker2D
      • +
      • Version History
      • MO-Ant
      • MO-Swimmer
      • MO-Humanoid
      • @@ -465,7 +466,7 @@

        4. Instantiate your environment + diff --git a/wrappers/vector_wrappers/index.html b/wrappers/vector_wrappers/index.html index d0fee15..411a0dd 100644 --- a/wrappers/vector_wrappers/index.html +++ b/wrappers/vector_wrappers/index.html @@ -252,6 +252,7 @@
      • MO-Hopper
      • MO-Halfcheetah
      • MO-Walker2D
      • +
      • Version History
      • MO-Ant
      • MO-Swimmer
      • MO-Humanoid
      • @@ -514,7 +515,7 @@

        MORecordEpisode - + diff --git a/wrappers/wrappers/index.html b/wrappers/wrappers/index.html index 22a8655..444ce2c 100644 --- a/wrappers/wrappers/index.html +++ b/wrappers/wrappers/index.html @@ -252,6 +252,7 @@
      • MO-Hopper
      • MO-Halfcheetah
      • MO-Walker2D
      • +
      • Version History
      • MO-Ant
      • MO-Swimmer
      • MO-Humanoid
      • @@ -526,7 +527,7 @@

        MOMaxAndSkipObs - +