From acad2a0ee04d03c37f5691bf9cf16c7ef71abc1c Mon Sep 17 00:00:00 2001
From: Kallinteris Andreas
 <30759571+Kallinteris-Andreas@users.noreply.github.com>
Date: Sat, 10 Feb 2024 16:51:33 +0200
Subject: [PATCH 1/4] pin `pyright==1.1.347` (match gymnasium) (#209)

---
 .pre-commit-config.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index 6ebaea8c..38f51360 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -39,7 +39,7 @@ repos:
         language: node
         pass_filenames: false
         types: [python]
-        additional_dependencies: ["pyright"]
+        additional_dependencies: ["pyright@1.1.347"]
         args:
           - --project=pyproject.toml
   - repo: https://github.com/pycqa/pydocstyle

From 12a336a4bdf3f1607691a582b29aea2e4b70110b Mon Sep 17 00:00:00 2001
From: Kallinteris Andreas
 <30759571+Kallinteris-Andreas@users.noreply.github.com>
Date: Sat, 17 Feb 2024 14:55:01 +0200
Subject: [PATCH 2/4]  `gymnasium==1.0` support (#211)

* WIP `gymnasium==1.0` support

* some fixes

* add `unwrapped` to `env` in `tests`

* `pre-commit`

* update DOCs `import` before `make`

* Update pyproject.toml

* Update pyproject.toml

* added `MazeEnv.model` and `MazeEnv.data`
---
 docs/content/multi-goal_api.md                  |  3 +++
 docs/envs/franka_kitchen/index.md               |  3 +++
 docs/envs/shadow_dexterous_hand/index.md        |  3 +++
 docs/index.md                                   |  4 ++++
 gymnasium_robotics/__init__.py                  |  4 +++-
 .../envs/adroit_hand/adroit_door.py             |  3 +++
 .../envs/adroit_hand/adroit_hammer.py           |  3 +++
 .../envs/adroit_hand/adroit_pen.py              |  3 +++
 .../envs/adroit_hand/adroit_relocate.py         |  3 +++
 gymnasium_robotics/envs/fetch/pick_and_place.py |  6 ++++++
 gymnasium_robotics/envs/fetch/push.py           |  6 ++++++
 gymnasium_robotics/envs/fetch/reach.py          |  6 ++++++
 gymnasium_robotics/envs/fetch/slide.py          |  6 ++++++
 .../envs/franka_kitchen/kitchen_env.py          |  4 ++++
 gymnasium_robotics/envs/maze/ant_maze.py        |  8 ++++++++
 gymnasium_robotics/envs/maze/ant_maze_v4.py     | 17 +++++++++++++++++
 gymnasium_robotics/envs/maze/point_maze.py      | 17 +++++++++++++++++
 .../envs/multiagent_mujoco/mujoco_multi.py      |  2 +-
 .../shadow_dexterous_hand/manipulate_block.py   |  7 ++++++-
 .../shadow_dexterous_hand/manipulate_egg.py     |  6 ++++++
 .../shadow_dexterous_hand/manipulate_pen.py     |  7 ++++++-
 pyproject.toml                                  |  4 ++--
 tests/envs/franka_kitchen/test_kitchen_env.py   |  4 ++--
 tests/envs/hand/test_manipulate.py              |  2 +-
 .../envs/hand/test_manipulate_touch_sensors.py  |  2 +-
 tests/envs/hand/test_reach.py                   |  2 +-
 tests/test_envs.py                              |  2 +-
 27 files changed, 125 insertions(+), 12 deletions(-)

diff --git a/docs/content/multi-goal_api.md b/docs/content/multi-goal_api.md
index 1c396ac8..d4458dfa 100644
--- a/docs/content/multi-goal_api.md
+++ b/docs/content/multi-goal_api.md
@@ -21,6 +21,9 @@ goal, e.g. state derived from the simulation.
 
 ```python
 import gymnasium as gym
+import gymnasium_robotics
+
+gym.register_envs(gymnasium_robotics)
 
 env = gym.make("FetchReach-v2")
 env.reset()
diff --git a/docs/envs/franka_kitchen/index.md b/docs/envs/franka_kitchen/index.md
index 7a20ab2c..7b54c5f5 100644
--- a/docs/envs/franka_kitchen/index.md
+++ b/docs/envs/franka_kitchen/index.md
@@ -16,6 +16,9 @@ The tasks can be selected when the environment is initialized passing a list of
 ```python
 
 import gymnasium as gym
+import gymnasium_robotics
+
+gym.register_envs(gymnasium_robotics)
 
 env = gym.make('FrankaKitchen-v1', tasks_to_complete=['microwave', 'kettle'])
 ```
diff --git a/docs/envs/shadow_dexterous_hand/index.md b/docs/envs/shadow_dexterous_hand/index.md
index c874e348..ae93485e 100644
--- a/docs/envs/shadow_dexterous_hand/index.md
+++ b/docs/envs/shadow_dexterous_hand/index.md
@@ -22,6 +22,9 @@ These environments are instanceated by adding the following strings to the Hand
 
 ```python
 import gymnasium as gym
+import gymnasium_robotics
+
+gym.register_envs(gymnasium_robotics)
 
 env = gym.make('HandManipulateEgg_BooleanTouchSensors-v1')
 ```
diff --git a/docs/index.md b/docs/index.md
index 6294ee8d..f40b7a63 100644
--- a/docs/index.md
+++ b/docs/index.md
@@ -52,6 +52,10 @@ The creation and interaction with the robotic environments follow the Gymnasium
 ```{code-block} python
 
 import gymnasium as gym
+import gymnasium_robotics
+
+gym.register_envs(gymnasium_robotics)
+
 env = gym.make("FetchPickAndPlace-v2", render_mode="human")
 observation, info = env.reset(seed=42)
 for _ in range(1000):
diff --git a/gymnasium_robotics/__init__.py b/gymnasium_robotics/__init__.py
index 326547d4..1b1c37d4 100644
--- a/gymnasium_robotics/__init__.py
+++ b/gymnasium_robotics/__init__.py
@@ -5,6 +5,8 @@
 from gymnasium_robotics.envs.maze import maps
 from gymnasium_robotics.envs.multiagent_mujoco import mamujoco_v0
 
+__version__ = "1.2.4"
+
 
 def register_robotics_envs():
     """Register all environment ID's to Gymnasium."""
@@ -1237,7 +1239,7 @@ def _merge(a, b):
     )
 
 
-__version__ = "1.2.4"
+register_robotics_envs()
 
 
 try:
diff --git a/gymnasium_robotics/envs/adroit_hand/adroit_door.py b/gymnasium_robotics/envs/adroit_hand/adroit_door.py
index 323222ab..e2d02caa 100644
--- a/gymnasium_robotics/envs/adroit_hand/adroit_door.py
+++ b/gymnasium_robotics/envs/adroit_hand/adroit_door.py
@@ -163,6 +163,9 @@ class AdroitHandDoorEnv(MujocoEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('AdroitHandDoor-v1', max_episode_steps=400)
     ```
diff --git a/gymnasium_robotics/envs/adroit_hand/adroit_hammer.py b/gymnasium_robotics/envs/adroit_hand/adroit_hammer.py
index 8d4c6c0d..af68a408 100644
--- a/gymnasium_robotics/envs/adroit_hand/adroit_hammer.py
+++ b/gymnasium_robotics/envs/adroit_hand/adroit_hammer.py
@@ -172,6 +172,9 @@ class AdroitHandHammerEnv(MujocoEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('AdroitHandHammer-v1', max_episode_steps=400)
     ```
diff --git a/gymnasium_robotics/envs/adroit_hand/adroit_pen.py b/gymnasium_robotics/envs/adroit_hand/adroit_pen.py
index 5e0f6517..37e4e2e6 100644
--- a/gymnasium_robotics/envs/adroit_hand/adroit_pen.py
+++ b/gymnasium_robotics/envs/adroit_hand/adroit_pen.py
@@ -165,6 +165,9 @@ class AdroitHandPenEnv(MujocoEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('AdroitHandPen-v1', max_episode_steps=400)
     ```
diff --git a/gymnasium_robotics/envs/adroit_hand/adroit_relocate.py b/gymnasium_robotics/envs/adroit_hand/adroit_relocate.py
index 8cb41138..db9031cf 100644
--- a/gymnasium_robotics/envs/adroit_hand/adroit_relocate.py
+++ b/gymnasium_robotics/envs/adroit_hand/adroit_relocate.py
@@ -165,6 +165,9 @@ class AdroitHandRelocateEnv(MujocoEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('AdroitHandRelocate-v1', max_episode_steps=400)
     ```
diff --git a/gymnasium_robotics/envs/fetch/pick_and_place.py b/gymnasium_robotics/envs/fetch/pick_and_place.py
index b6d0673c..74b5ed21 100644
--- a/gymnasium_robotics/envs/fetch/pick_and_place.py
+++ b/gymnasium_robotics/envs/fetch/pick_and_place.py
@@ -92,6 +92,9 @@ class MujocoFetchPickAndPlaceEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchPickAndPlaceDense-v2')
     ```
@@ -118,6 +121,9 @@ class MujocoFetchPickAndPlaceEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchPickAndPlace-v2', max_episode_steps=100)
     ```
diff --git a/gymnasium_robotics/envs/fetch/push.py b/gymnasium_robotics/envs/fetch/push.py
index 57545ac9..10a87282 100644
--- a/gymnasium_robotics/envs/fetch/push.py
+++ b/gymnasium_robotics/envs/fetch/push.py
@@ -120,6 +120,9 @@ class MujocoFetchPushEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchPushDense-v2')
     ```
@@ -146,6 +149,9 @@ class MujocoFetchPushEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchPush-v2', max_episode_steps=100)
     ```
diff --git a/gymnasium_robotics/envs/fetch/reach.py b/gymnasium_robotics/envs/fetch/reach.py
index 19e2b6cf..962fd74d 100644
--- a/gymnasium_robotics/envs/fetch/reach.py
+++ b/gymnasium_robotics/envs/fetch/reach.py
@@ -82,6 +82,9 @@ class MujocoFetchReachEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchReachDense-v2')
     ```
@@ -104,6 +107,9 @@ class MujocoFetchReachEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchReach-v2', max_episode_steps=100)
     ```
diff --git a/gymnasium_robotics/envs/fetch/slide.py b/gymnasium_robotics/envs/fetch/slide.py
index bc0dbf4e..1381b4a5 100644
--- a/gymnasium_robotics/envs/fetch/slide.py
+++ b/gymnasium_robotics/envs/fetch/slide.py
@@ -120,6 +120,9 @@ class MujocoFetchSlideEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchSlideDense-v2')
     ```
@@ -145,6 +148,9 @@ class MujocoFetchSlideEnv(MujocoFetchEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('FetchSlide-v2', max_episode_steps=100)
     ```
diff --git a/gymnasium_robotics/envs/franka_kitchen/kitchen_env.py b/gymnasium_robotics/envs/franka_kitchen/kitchen_env.py
index beba0af9..a8c0c3cc 100644
--- a/gymnasium_robotics/envs/franka_kitchen/kitchen_env.py
+++ b/gymnasium_robotics/envs/franka_kitchen/kitchen_env.py
@@ -64,6 +64,10 @@ class KitchenEnv(GoalEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
+
     env = gym.make('FrankaKitchen-v1', tasks_to_complete=['microwave', 'kettle'])
     ```
 
diff --git a/gymnasium_robotics/envs/maze/ant_maze.py b/gymnasium_robotics/envs/maze/ant_maze.py
index b586e9e8..d1395e78 100644
--- a/gymnasium_robotics/envs/maze/ant_maze.py
+++ b/gymnasium_robotics/envs/maze/ant_maze.py
@@ -122,3 +122,11 @@ def render(self):
     def close(self):
         super().close()
         self.ant_env.close()
+
+    @property
+    def model(self):
+        return self.ant_env.model
+
+    @property
+    def data(self):
+        return self.ant_env.data
diff --git a/gymnasium_robotics/envs/maze/ant_maze_v4.py b/gymnasium_robotics/envs/maze/ant_maze_v4.py
index bf8ec0f2..edcf7f5e 100644
--- a/gymnasium_robotics/envs/maze/ant_maze_v4.py
+++ b/gymnasium_robotics/envs/maze/ant_maze_v4.py
@@ -65,6 +65,9 @@ class AntMazeEnv(MazeEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     example_map = [[1, 1, 1, 1, 1],
            [1, C, 0, C, 1],
@@ -158,6 +161,9 @@ class AntMazeEnv(MazeEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('AntMaze_UMaze-v4')
     ```
@@ -192,6 +198,9 @@ class AntMazeEnv(MazeEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('AntMaze_UMaze-v4', max_episode_steps=100)
     ```
@@ -319,3 +328,11 @@ def render(self):
     def close(self):
         super().close()
         self.ant_env.close()
+
+    @property
+    def model(self):
+        return self.ant_env.model
+
+    @property
+    def data(self):
+        return self.ant_env.data
diff --git a/gymnasium_robotics/envs/maze/point_maze.py b/gymnasium_robotics/envs/maze/point_maze.py
index 33b263e7..e655f628 100644
--- a/gymnasium_robotics/envs/maze/point_maze.py
+++ b/gymnasium_robotics/envs/maze/point_maze.py
@@ -196,6 +196,9 @@ class PointMazeEnv(MazeEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     example_map = [[1, 1, 1, 1, 1],
            [1, C, 0, C, 1],
@@ -253,6 +256,9 @@ class PointMazeEnv(MazeEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('PointMaze_UMazeDense-v3')
     ```
@@ -286,6 +292,9 @@ class PointMazeEnv(MazeEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('PointMaze_UMaze-v3', max_episode_steps=100)
     ```
@@ -415,3 +424,11 @@ def render(self):
     def close(self):
         super().close()
         self.point_env.close()
+
+    @property
+    def model(self):
+        return self.point_env.model
+
+    @property
+    def data(self):
+        return self.point_env.data
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py b/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py
index 76d99a4e..0d671d16 100755
--- a/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py
@@ -20,7 +20,7 @@
 import gymnasium
 import numpy as np
 import pettingzoo
-from gymnasium.wrappers.time_limit import TimeLimit
+from gymnasium.wrappers import TimeLimit
 
 from gymnasium_robotics.envs.multiagent_mujoco.coupled_half_cheetah import (
     CoupledHalfCheetahEnv,
diff --git a/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_block.py b/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_block.py
index f0ffe70c..bd82c3d4 100644
--- a/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_block.py
+++ b/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_block.py
@@ -166,6 +166,9 @@ class MujocoHandBlockEnv(MujocoManipulateEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('HandManipulateBlock-v1')
     ```
@@ -193,6 +196,9 @@ class MujocoHandBlockEnv(MujocoManipulateEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('HandManipulateBlock-v1', max_episode_steps=100)
     ```
@@ -203,7 +209,6 @@ class MujocoHandBlockEnv(MujocoManipulateEnv, EzPickle):
 
     * v1: the environment depends on the newest [mujoco python bindings](https://mujoco.readthedocs.io/en/latest/python.html) maintained by the MuJoCo team in Deepmind.
     * v0: the environment depends on `mujoco_py` which is no longer maintained.
-
     """
 
     def __init__(
diff --git a/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_egg.py b/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_egg.py
index fab89d99..d0f6f0d8 100644
--- a/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_egg.py
+++ b/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_egg.py
@@ -169,6 +169,9 @@ class MujocoHandEggEnv(MujocoManipulateEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('HandManipulateEgg-v1')
     ```
@@ -196,6 +199,9 @@ class MujocoHandEggEnv(MujocoManipulateEnv, EzPickle):
 
     ```
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('HandManipulateEgg-v1', max_episode_steps=100)
     ```
diff --git a/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_pen.py b/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_pen.py
index 03682268..b9f9fb35 100644
--- a/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_pen.py
+++ b/gymnasium_robotics/envs/shadow_dexterous_hand/manipulate_pen.py
@@ -168,6 +168,9 @@ class MujocoHandPenEnv(MujocoManipulateEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('HandManipulatePen-v1')
     ```
@@ -195,6 +198,9 @@ class MujocoHandPenEnv(MujocoManipulateEnv, EzPickle):
 
     ```python
     import gymnasium as gym
+    import gymnasium_robotics
+
+    gym.register_envs(gymnasium_robotics)
 
     env = gym.make('HandManipulatePen-v1', max_episode_steps=100)
     ```
@@ -205,7 +211,6 @@ class MujocoHandPenEnv(MujocoManipulateEnv, EzPickle):
 
     * v1: the environment depends on the newest [mujoco python bindings](https://mujoco.readthedocs.io/en/latest/python.html) maintained by the MuJoCo team in Deepmind.
     * v0: the environment depends on `mujoco_py` which is no longer maintained.
-
     """
 
     def __init__(
diff --git a/pyproject.toml b/pyproject.toml
index 3e482142..4c4961d5 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -24,9 +24,9 @@ classifiers = [
     'Topic :: Scientific/Engineering :: Artificial Intelligence',
 ]
 dependencies = [
-    "mujoco>=2.3.3, <3.0",
+    "mujoco>=2.2.0",
     "numpy>=1.21.0",
-    "gymnasium>=0.26",
+    "gymnasium>=1.0.0a1",
     "PettingZoo>=1.23.0",
     "Jinja2>=3.0.3",
     "imageio"
diff --git a/tests/envs/franka_kitchen/test_kitchen_env.py b/tests/envs/franka_kitchen/test_kitchen_env.py
index e6616cf6..4c3f92b4 100644
--- a/tests/envs/franka_kitchen/test_kitchen_env.py
+++ b/tests/envs/franka_kitchen/test_kitchen_env.py
@@ -47,7 +47,7 @@ def test_task_completion(remove_task_when_completed, terminate_on_tasks_complete
         # Complete a task sequentially for each environment step
         for task in TASKS:
             # Force task to be achieved
-            env.data.qpos[OBS_ELEMENT_INDICES[task]] = OBS_ELEMENT_GOALS[task]
+            env.unwrapped.data.qpos[OBS_ELEMENT_INDICES[task]] = OBS_ELEMENT_GOALS[task]
             _, _, terminated, _, info = env.step(env.action_space.sample())
             completed_tasks.add(task)
 
@@ -91,7 +91,7 @@ def test_task_completion(remove_task_when_completed, terminate_on_tasks_complete
         # Complete a task sequentially for each environment step
         for task in TASKS:
             # Force task to be achieved
-            env.data.qpos[OBS_ELEMENT_INDICES[task]] = OBS_ELEMENT_GOALS[task]
+            env.unwrapped.data.qpos[OBS_ELEMENT_INDICES[task]] = OBS_ELEMENT_GOALS[task]
             completed_tasks.add(task)
 
         _, _, terminated, _, info = env.step(env.action_space.sample())
diff --git a/tests/envs/hand/test_manipulate.py b/tests/envs/hand/test_manipulate.py
index e1afe251..c27b3d5a 100644
--- a/tests/envs/hand/test_manipulate.py
+++ b/tests/envs/hand/test_manipulate.py
@@ -16,7 +16,7 @@ def test_serialize_deserialize(environment_id):
     env1.reset()
     env2 = pickle.loads(pickle.dumps(env1))
 
-    assert env1.target_position == env2.target_position, (
+    assert env1.unwrapped.target_position == env2.unwrapped.target_position, (
         env1.target_position,
         env2.target_position,
     )
diff --git a/tests/envs/hand/test_manipulate_touch_sensors.py b/tests/envs/hand/test_manipulate_touch_sensors.py
index 4cda849d..f741e3f4 100644
--- a/tests/envs/hand/test_manipulate_touch_sensors.py
+++ b/tests/envs/hand/test_manipulate_touch_sensors.py
@@ -16,7 +16,7 @@ def test_serialize_deserialize(environment_id):
     env1.reset()
     env2 = pickle.loads(pickle.dumps(env1))
 
-    assert env1.target_position == env2.target_position, (
+    assert env1.unwrapped.target_position == env2.unwrapped.target_position, (
         env1.target_position,
         env2.target_position,
     )
diff --git a/tests/envs/hand/test_reach.py b/tests/envs/hand/test_reach.py
index 6596aa12..7cf93665 100644
--- a/tests/envs/hand/test_reach.py
+++ b/tests/envs/hand/test_reach.py
@@ -8,7 +8,7 @@ def test_serialize_deserialize():
     env1.reset()
     env2 = pickle.loads(pickle.dumps(env1))
 
-    assert env1.distance_threshold == env2.distance_threshold, (
+    assert env1.unwrapped.distance_threshold == env2.unwrapped.distance_threshold, (
         env1.distance_threshold,
         env2.distance_threshold,
     )
diff --git a/tests/test_envs.py b/tests/test_envs.py
index 6fc05928..472652c3 100644
--- a/tests/test_envs.py
+++ b/tests/test_envs.py
@@ -14,7 +14,7 @@
     for message in [
         "This version of the mujoco environments depends on the mujoco-py bindings, which are no longer maintained and may stop working. Please upgrade to the v4 versions of the environments (which depend on the mujoco python bindings instead), unless you are trying to precisely replicate previous works).",
         "A Box observation space minimum value is -infinity. This is probably too low.",
-        "A Box observation space maximum value is -infinity. This is probably too high.",
+        "A Box observation space maximum value is infinity. This is probably too high.",
         "For Box action spaces, we recommend using a symmetric and normalized space (range=[-1, 1] or [0, 1]). See https://stable-baselines3.readthedocs.io/en/master/guide/rl_tips.html for more information.",
     ]
 ]

From 8606192735a9963d1dcc12feade037b77d9349be Mon Sep 17 00:00:00 2001
From: Kallinteris Andreas
 <30759571+Kallinteris-Andreas@users.noreply.github.com>
Date: Mon, 19 Feb 2024 18:36:26 +0200
Subject: [PATCH 3/4] add `MaMuJoCo-v1` environments (#196)

* (temp) make mamujoco requirement mandatory

* MaMuJoCo Doc update

* add ant2x4 image

* `MaMuJoCo` DOC Update (adding action space PICs)

* more pics

* typo fix

* typo fixes

* fix `sphinx` warning

* `MaMuJoCo` DOC update

* minor formatting changes

* add `kwargs`

* add `mujoco-v5` (init)

* `pre-commit`

* add hopper_v5

* add walker2d

* add Half Cheetah

* typo fix

* add pusher

* add swimmer

* pre-commit

* typo fix

* `xml_file` arg fixes

* added `InvertedPendulum-v5`

* cleanup

* rename

* fix camera on new models

* add inv_double_pend

* fix `humanoid` `info`

* `humanoid` add include obs arguments

* update reacher DOC

* update obs shape (humanoid)

* `Ant` cleanup and fix `info`

* update `Ant` doc

* re-add to humanoid `contact_cost`

* fix obs shape

* inv_double_pend update doc

* Ant doc update

* reacher add changelog

* `xml_file` doc fix for hopper and walker

* update humanoid doc

* Ant obs doc fix

* add `__credits__`

* `pre-commit`

* doc update

* doc args cleanup

* fix pusher changelogs

* `reacher` & `pusher` add xml_file argument

* fix typos in `humanoid`

* rename obs args

* ant add `include_cfrc_ext_in_observation`

* register new envs

* fix register

* typo fix

* fix humanoid pickle

* fix humanoid pickle (for real this time)

* add `reset_noise_scale` to double_pend

* add new inv_double_pend args

* inv_double_pend re_order ez pickle init to the start

* add humanoidstandup

* update humanoid standup `info`

* `pre-commit`

* cleanup

* hopper add `info` "z_distance_from_origin"

* fix

* add `frame_skip` argument

* add tendon `info`

* fix exclude refactor

* update doc

* update obs creation

* typo fix

* cleanup

* fixed humanoid arguments docs

* add dynamic obs_size calculation

* add `metadata["observation_structure"]`

* cartpole add args

* typo fix

* added `reacher`&`pusher` reward weights

* cleanup

* cleanup

* cleanup

* `pre-commit`

* add `default_camera_config` argument

* fix `ant/humanoid` `info["x/y_position"]`

* `ant` add `forward_reward_weight`

* ant doc

* `ant` cleaned up xy pos acquisition

* added `main_body`

* fix `healthy_reward`

* pre-commit

* fix ant velocity

* dict

* update renderer

* add `walker2d` `info[z_distance_from_origin]`

* add `reset_info`

* refactored observation structures to a member variable

* cleanup observation_structure

* Final? documentation update

* cleanup

* fix distance_from_origin info

* pre-commit

* Update maze_v4.py

* cleanup

* cleanup

* clean

* cleanup local/global cat generation

* remove `obsk._observation_structure`

* type hint addition

* doc typo fix

* more to `gymnasium/mujoco-v5`

* disable const 0 observation (`Ant`&`Humanoid`)

* port to v5 (missed one)

* `dummy_node`, when `factorization=None` now includes action_id

* update `map_global_state_to_local_observations` for `v5`

* fix `Walker2d` globals from `[root_x, root_x, root_z]` to `[root_x, root_z, root_y]`

* add `ignore_body_fn` in `build_obs`

* enhance observation mapping

* fix map_obs_local2global error msg

* remove `ManySegment` classes

* rename to `v1`

* update docstrings

* cleanup

* add support for loading custom envs

* cleanup

* cleanup

* fixed temp assets not being removed

* fix stupid bug

* update manysegswimmer timestep to match swimmer

* update swimmer to support `mujoco>=3.0.0`

* change manysegmentant timestep

* add test for many segment swimmer

* expand testing to include different obs types

* add a comment

* factorization and cleanup

* `gymnasium==1.0.0` compatibility

* `gymnasium==1.0.0` API

* updated documentation

* update single

* make `jinja2` optional and cleanup

* add multiswimmer doc

* Update pyproject.toml

* Update pyproject.toml

* Update __init__.py

* Update __init__.py

* `pre-commit`

* Update index.md

* Update many_segment_swimmer.py

* Update many_segment_ant.py

* Update ma_ant.md

* Update ma_coupled_half_cheetah.md

* Update ma_half_cheetah.md

* Update ma_hopper.md

* Update ma_humanoid.md

* Update ma_humanoid_standup.md

* Update ma_multiagentswimmer.md

* Update ma_pusher.md

* Update ma_reacher.md

* Update ma_single.md

* Update ma_swimmer.md

* Update ma_walker2d.md

* Update README.md
---
 README.md                                     |   2 +
 docs/envs/MaMuJoCo/index.md                   |  31 +-
 docs/envs/MaMuJoCo/ma_ant.md                  |  20 +-
 docs/envs/MaMuJoCo/ma_coupled_half_cheetah.md |  10 +-
 docs/envs/MaMuJoCo/ma_half_cheetah.md         |  12 +-
 docs/envs/MaMuJoCo/ma_hopper.md               |  10 +-
 docs/envs/MaMuJoCo/ma_humanoid.md             |  11 +-
 docs/envs/MaMuJoCo/ma_humanoid_standup.md     |  11 +-
 docs/envs/MaMuJoCo/ma_multiagentswimmer.md    |  81 ++++
 docs/envs/MaMuJoCo/ma_pusher.md               |  10 +-
 docs/envs/MaMuJoCo/ma_reacher.md              |  10 +-
 docs/envs/MaMuJoCo/ma_single.md               |   6 +-
 docs/envs/MaMuJoCo/ma_swimmer.md              |  10 +-
 docs/envs/MaMuJoCo/ma_walker2d.md             |  11 +-
 gymnasium_robotics/__init__.py                |   4 +-
 .../envs/multiagent_mujoco/__init__.py        |   6 -
 .../assets/many_segment_ant.xml.template      |   8 +-
 .../assets/many_segment_swimmer.xml.template  |  13 +-
 .../multiagent_mujoco/coupled_half_cheetah.py |   4 +-
 .../{mamujoco_v0.py => mamujoco_v1.py}        |   0
 .../multiagent_mujoco/many_segment_ant.py     | 233 +++--------
 .../multiagent_mujoco/many_segment_swimmer.py | 197 +++------
 .../envs/multiagent_mujoco/mujoco_multi.py    | 376 +++++++++++-------
 .../envs/multiagent_mujoco/obsk.py            | 128 ++----
 tests/envs/MaMuJoCo/test_MaMuJoCo.py          | 178 ++++++---
 25 files changed, 674 insertions(+), 708 deletions(-)
 create mode 100644 docs/envs/MaMuJoCo/ma_multiagentswimmer.md
 rename gymnasium_robotics/envs/multiagent_mujoco/{mamujoco_v0.py => mamujoco_v1.py} (100%)

diff --git a/README.md b/README.md
index 403ec1dc..c8d0031d 100644
--- a/README.md
+++ b/README.md
@@ -32,6 +32,8 @@ The [D4RL](https://github.com/Farama-Foundation/D4RL) environments are now avail
 The different tasks involve hammering a nail, opening a door, twirling a pen, or picking up and moving a ball.
 * [Franka Kitchen](https://robotics.farama.org/envs/franka_kitchen/) - Multitask environment in which a 9-DoF Franka robot is placed in a kitchen containing several common household items. The goal of each task is to interact with the items in order to reach a desired goal configuration.
 
+* [MaMuJoCo](https://robotics.farama.org/envs/MaMuJoCo/) - A collection of multi-agent factorizations of the [Gymnasium/MuJoCo](https://gymnasium.farama.org/environments/mujoco/) environments and a framework for factorizing robotic environments. It uses the [pettingzoo.ParallelEnv](https://pettingzoo.farama.org/api/parallel/) API.
+
 **WIP**: generate new `D4RL` environment datasets with [Minari](https://github.com/Farama-Foundation/Minari).
 
 ## Multi-goal API
diff --git a/docs/envs/MaMuJoCo/index.md b/docs/envs/MaMuJoCo/index.md
index b70a16a5..94d2b9b0 100644
--- a/docs/envs/MaMuJoCo/index.md
+++ b/docs/envs/MaMuJoCo/index.md
@@ -19,20 +19,19 @@ Gymansium-Robotics/MaMuJoCo Represents the first, easy to use Framework for rese
 MaMuJoCo mainly uses the [PettingZoo.ParallelAPI](https://pettingzoo.farama.org/api/parallel/), but also supports a few extra functions:
 
 ```{eval-rst}
-.. autofunction:: gymnasium_robotics.mamujoco_v0.parallel_env.map_local_actions_to_global_action
+.. autofunction:: gymnasium_robotics.mamujoco_v1.parallel_env.map_local_actions_to_global_action
 ```
-
 ```{eval-rst}
-.. autofunction:: gymnasium_robotics.mamujoco_v0.parallel_env.map_global_action_to_local_actions
+.. autofunction:: gymnasium_robotics.mamujoco_v1.parallel_env.map_global_action_to_local_actions
 ```
 ```{eval-rst}
-.. autofunction:: gymnasium_robotics.mamujoco_v0.parallel_env.map_global_state_to_local_observations
+.. autofunction:: gymnasium_robotics.mamujoco_v1.parallel_env.map_global_state_to_local_observations
 ```
 ```{eval-rst}
-.. autofunction:: gymnasium_robotics.mamujoco_v0.parallel_env.map_local_observation_to_global_state
+.. autofunction:: gymnasium_robotics.mamujoco_v1.parallel_env.map_local_observations_to_global_state
 ```
 ```{eval-rst}
-.. autofunction:: gymnasium_robotics.mamujoco_v0.get_parts_and_edges
+.. autofunction:: gymnasium_robotics.mamujoco_v1.get_parts_and_edges
 ```
 
 MaMuJoCo also supports the [PettingZoo.AECAPI](https://pettingzoo.farama.org/api/aec/) but does not expose extra functions.
@@ -41,19 +40,19 @@ MaMuJoCo also supports the [PettingZoo.AECAPI](https://pettingzoo.farama.org/api
 
 ### Arguments
 ```{eval-rst}
-.. autofunction:: gymnasium_robotics.mamujoco_v0.parallel_env.__init__
+.. autofunction:: gymnasium_robotics.mamujoco_v1.parallel_env.__init__
 ```
 
 
 
 ## How to create new agent factorizations 
-### example 'Ant-v4', '8x1'
+### example 'Ant-v5', '8x1'
 In this example, we will create an agent factorization not present in Gymnasium-Robotics/MaMuJoCo the "Ant"/'8x1', where each agent controls a single joint/action (first implemented by [safe-MaMuJoCo](https://github.com/chauncygu/Safe-Multi-Agent-Mujoco)).
 
 first we will load the graph of MaMuJoCo:
 ```python
->>> from gymnasium_robotics.mamujoco_v0 import get_parts_and_edges
->>> unpartioned_nodes, edges, global_nodes = get_parts_and_edges('Ant-v4', None)
+>>> from gymnasium_robotics.mamujoco_v1 import get_parts_and_edges
+>>> unpartioned_nodes, edges, global_nodes = get_parts_and_edges('Ant-v5', None)
 ```
 The `unpartioned_nodes` contain the nodes of the MaMuJoCo graph.
 The `edges` well, contain the edges of the graph.
@@ -63,18 +62,23 @@ To create our '8x1' partition we will need to partition the `unpartioned_nodes`:
 ```python
 >>> unpartioned_nodes
 [(hip1, ankle1, hip2, ankle2, hip3, ankle3, hip4, ankle4)]
->>> partioned_nodes = [(unpartioned_nodes[0][0],), (unpartioned_nodes[0][1],), (unpartioned_nodes[0][2],), (unpartioned_nodes[0][3],), (unpartioned_nodes[0][4],), (unpartioned_nodes[0][5],), (unpartioned_nodes[0][6],), (unpartioned_nodes[0][7],)]>>> partioned_nodes
+>>> partioned_nodes = [(unpartioned_nodes[0][0],), (unpartioned_nodes[0][1],), (unpartioned_nodes[0][2],), (unpartioned_nodes[0][3],), (unpartioned_nodes[0][4],), (unpartioned_nodes[0][5],), (unpartioned_nodes[0][6],), (unpartioned_nodes[0][7],)]
 >>> partioned_nodes
 [(hip1,), (ankle1,), (hip2,), (ankle2,), (hip3,), (ankle3,), (hip4,), (ankle4,)]
 ```
 Finally package the partitions and create our environment:
 ```python
 >>> my_agent_factorization = {"partition": partioned_nodes, "edges": edges, "globals": global_nodes}
->>> gym_env = mamujoco_v0('Ant', '8x1', agent_factorization=my_agent_factorization)
+>>> gym_env = mamujoco_v1.parallel_env('Ant', '8x1', agent_factorization=my_agent_factorization)
 ```
 
 ## Version History
-v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of [the original multiagent_mujuco](https://github.com/schroederdewitt/multiagent_mujoco)
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+	- When `factorization=None`, the `env.agent_action_partitions.dummy_node` now contains `action_id` (it used to be `None`).
+	- Added `map_local_observations_to_global_state` & optimized runtime performance of `map_global_state_to_local_observations`.
+	- Added `gym_env` argument which can be used to load third-party `Gymnasium.MujocoEnv` environments.
+* v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of [the original multiagent_mujuco](https://github.com/schroederdewitt/multiagent_mujoco)
 
 ```{toctree}
 :hidden:
@@ -84,6 +88,7 @@ ma_half_cheetah.md
 ma_hopper.md
 ma_humanoid_standup.md
 ma_humanoid.md
+ma_multiagentswimmer.md
 ma_reacher.md
 ma_swimmer.md
 ma_pusher.md
diff --git a/docs/envs/MaMuJoCo/ma_ant.md b/docs/envs/MaMuJoCo/ma_ant.md
index d1bb06f4..150de59a 100644
--- a/docs/envs/MaMuJoCo/ma_ant.md
+++ b/docs/envs/MaMuJoCo/ma_ant.md
@@ -15,7 +15,7 @@ This Environment is part of [MaMuJoCo](https://robotics.farama.org/envs/MaMuJoCo
 The task is [Gymansium's MuJoCo/Ant](https://gymnasium.farama.org/environments/mujoco/ant/).
 
 
-| Defaults		| `env = mamujoco_v0.parallel_env("Ant", None)`		|
+| Defaults		| `env = mamujoco_v1.parallel_env("Ant", None)`		|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -23,14 +23,14 @@ The task is [Gymansium's MuJoCo/Ant](https://gymnasium.farama.org/environments/m
 | Part partition	| `[(hip4, ankle4, hip1, ankle1, hip2, ankle2, hip3, ankle3)]`	|
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/ant.png
     :name: ant
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Ant", None)`		|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Ant", None)`		|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -56,7 +56,7 @@ If partitioning, is None then the environment contains a single agent with the s
     :name: ant_2x4
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Ant", "2x4")`		|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Ant", "2x4")`		|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`					|
 | Number of Agents	| 2							|
@@ -86,7 +86,7 @@ The environment is partitioned in 2 parts, the front part (containing the front
     :name: ant_2x4d
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Ant", "2x4d")`		|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Ant", "2x4d")`		|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`					|
 | Number of Agents	| 2							|
@@ -114,7 +114,7 @@ The environment is partitioned in 2 parts, split diagonally.
     :name: ant_4x2
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Ant", "4x2")`		|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Ant", "4x2")`		|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1', 'agent_2', 'agent_3']`			|
 | Number of Agents	| 4							|
@@ -168,7 +168,7 @@ All agents receive the same [Gymnasium's Ant](https://gymnasium.farama.org/envir
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Ant](https://gymnasium.farama.org/environments/mujoco/ant/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Ant](https://gymnasium.farama.org/environments/mujoco/ant/#starting-state).
 
 
 
@@ -178,7 +178,11 @@ All agent terminate and truncate at the same time given the same conditions as [
 
 
 ## Version History
-- v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+	- Now observes `local_categories` of `cfrc_ext` by default (same as `Gymnasium/MuJoCo-v5/Ant`).
+	- Renamed global node `torso` → `root`.
+* v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Fixed diagonal factorization ("2x4d") not being diagonal.
 	- Fixed Global observations (The Ant's Torso: `rootx`, `rooty`, `rootz`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_coupled_half_cheetah.md b/docs/envs/MaMuJoCo/ma_coupled_half_cheetah.md
index 3acaae3e..da6d89ef 100644
--- a/docs/envs/MaMuJoCo/ma_coupled_half_cheetah.md
+++ b/docs/envs/MaMuJoCo/ma_coupled_half_cheetah.md
@@ -11,14 +11,14 @@ The environment consists of 2 half cheetahs coupled by an elastic tendon.
 
 
 ## Action Space
-The action spaces is depended on the partitioning.
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/coupled_half_cheetah.png
     :name: coupled_half_cheetah
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("CoupledHalfCheetah", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("CoupledHalfCheetah", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -49,7 +49,7 @@ If partitioning, is `None`, then the environment contains a single agent with th
     :name: coupled_half_cheetah_1p1
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("CoupledHalfCheetah", "1p1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("CoupledHalfCheetah", "1p1")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 2							|
@@ -98,7 +98,7 @@ All agents receive the same average reward of each cheetah.
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Half Cheetah](https://gymnasium.farama.org/environments/mujoco/half_cheetah/#starting-state) (but with 2 cheetahs).
+The starting state of the environment is the same as [Gymnasium's Half Cheetah](https://gymnasium.farama.org/environments/mujoco/half_cheetah/#starting-state) (but with 2 cheetahs).
 
 
 
@@ -108,6 +108,8 @@ All agent terminate and truncate at the same time, given the same conditions as
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Fixed action mapping of the second cheetah (It would previously not work)
diff --git a/docs/envs/MaMuJoCo/ma_half_cheetah.md b/docs/envs/MaMuJoCo/ma_half_cheetah.md
index 4f463b8e..88b4a364 100644
--- a/docs/envs/MaMuJoCo/ma_half_cheetah.md
+++ b/docs/envs/MaMuJoCo/ma_half_cheetah.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Half Cheetah](https://gymnasium.farama.org/envir
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/half_cheetah.png
     :name: half_cheetah
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("HalfCheetah", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("HalfCheetah", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -47,7 +47,7 @@ If partitioning, is `None`, then the environment contains a single agent with th
     :name: half_cheetah_2x3
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("HalfCheetah", "2x3")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("HalfCheetah", "2x3")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`					|
 | Number of Agents	| 2							|
@@ -75,7 +75,7 @@ The environment is partitioned in 2 parts, the front part (containing the front
     :name: half_cheetah_6x1
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("HalfCheetah", "6x1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("HalfCheetah", "6x1")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1', 'agent_2', 'agent_3', 'agent_4', 'agent_5']`			|
 | Number of Agents	| 6							|
@@ -129,7 +129,7 @@ All agents receive the same [Gymnasium's Half Cheetah](https://gymnasium.farama.
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Half Cheetah](https://gymnasium.farama.org/environments/mujoco/half_cheetah/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Half Cheetah](https://gymnasium.farama.org/environments/mujoco/half_cheetah/#starting-state).
 
 
 
@@ -138,6 +138,8 @@ All agent terminate and truncate at the same time, given the same conditions as
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Added/Fixed Global observations (The Cheetah's front tip: `rootx`, `rooty`, `rootz`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_hopper.md b/docs/envs/MaMuJoCo/ma_hopper.md
index bc27fb69..40bbf6f0 100644
--- a/docs/envs/MaMuJoCo/ma_hopper.md
+++ b/docs/envs/MaMuJoCo/ma_hopper.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Hopper](https://gymnasium.farama.org/environment
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/hopper.png
     :name: hopper
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Hopper", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Hopper", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -47,7 +47,7 @@ If partitioning, is `None`, then the environment contains a single agent with th
     :name: hopper_3x1
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Hopper", "3x1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Hopper", "3x1")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1', 'agent_2']`			|
 | Number of Agents	| 3							|
@@ -89,7 +89,7 @@ All agents receive the same [Gymnasium's Hopper](https://gymnasium.farama.org/en
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Hopper](https://gymnasium.farama.org/environments/mujoco/hopper/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Hopper](https://gymnasium.farama.org/environments/mujoco/hopper/#starting-state).
 
 
 
@@ -98,6 +98,8 @@ All agent terminate and truncate at same time given the same conditions as [Gymn
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Fixed Global observations (The Hopper's top: `rootx`, `rooty`, `rootz`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_humanoid.md b/docs/envs/MaMuJoCo/ma_humanoid.md
index 52291ad9..47d8afa2 100644
--- a/docs/envs/MaMuJoCo/ma_humanoid.md
+++ b/docs/envs/MaMuJoCo/ma_humanoid.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Humanoid](https://gymnasium.farama.org/environme
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/humanoid.png
     :name: humanoid
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Humanoid", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Humanoid", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -60,7 +60,7 @@ If partitioning, is `None` then the environment contains a single agent with the
     :name: humanoid_9|8
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Humanoid", "3x1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Humanoid", "9\|8")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 2							|
@@ -114,7 +114,7 @@ All agents receive the same [Gymnasium's Humanoid](https://gymnasium.farama.org/
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Humanoid](https://gymnasium.farama.org/environments/mujoco/humanoid/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Humanoid](https://gymnasium.farama.org/environments/mujoco/humanoid/#starting-state).
 
 
 
@@ -123,6 +123,9 @@ All agent terminate and truncate at the same time, given the same conditions as
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+	- No longer observes `qfrc_actuator` of `root` & `cinert`, `cvel`, `qfrc_actuator`, `cfrc_ext` of `worldbody` (same as `Gymnasium/MuJoCo-v5/Humanoid`).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Added/Fixed Global observations (The Humanoids's torso: `rootx`, `rooty`, `rootz`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_humanoid_standup.md b/docs/envs/MaMuJoCo/ma_humanoid_standup.md
index 55369e1c..d330a7f4 100644
--- a/docs/envs/MaMuJoCo/ma_humanoid_standup.md
+++ b/docs/envs/MaMuJoCo/ma_humanoid_standup.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Humanoid Standup](https://gymnasium.farama.org/e
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/humanoid.png
     :name: humanoid
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("HumanoidStandup", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("HumanoidStandup", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -60,7 +60,7 @@ If partitioning, is `None` then the environment contains a single agent with the
     :name: humanoid_9|8
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("HumanoidStandup", "3x1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("HumanoidStandup", "9\|8")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 2							|
@@ -114,7 +114,7 @@ All agents receive the same [Gymnasium's Humanoid Standup](https://gymnasium.far
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Humanoid Standup](https://gymnasium.farama.org/environments/mujoco/humanoid_standup/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Humanoid Standup](https://gymnasium.farama.org/environments/mujoco/humanoid_standup/#starting-state).
 
 
 
@@ -123,6 +123,9 @@ All agent terminate and truncate at the same time, given the same conditions as
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+	- No longer observes `qfrc_actuator` of `root` & `cinert`, `cvel`, `qfrc_actuator`, `cfrc_ext` of `worldbody` (same as `Gymnasium/MuJoCo-v5/HumanoidStandup`).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Added/Fixed Global observations (The Humanoids's torso: `rootx`, `rooty`, `rootz`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_multiagentswimmer.md b/docs/envs/MaMuJoCo/ma_multiagentswimmer.md
new file mode 100644
index 00000000..ce3657ca
--- /dev/null
+++ b/docs/envs/MaMuJoCo/ma_multiagentswimmer.md
@@ -0,0 +1,81 @@
+---
+firstpage:
+lastpage:
+---
+ManySegmentSwimmer
+
+# Swimmer
+```{figure} figures/many_segment_swimmer.png
+    :name: many_segment_swimmer
+```
+
+
+This Environment is part of [MaMuJoCo](https://robotics.farama.org/envs/MaMuJoCo/) environments. Please read that page first for general information.
+The task is a variation of [Gymnasium's MuJoCo/Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/), which, instead of having 2 segments, has a configurable number of segments.
+
+The task was first introduced by Christian A. Schroeder de Witt in ["FACMAC: Factored Multi-Agent Centralised Policy Gradients"](https://arxiv.org/abs/2003.06709).
+
+
+## Action Space
+The shape of the action space depends on the partitioning. The partitioning has the following form: `${Number Of Agents}x${Number Of Segments per Agent}`
+
+| Instantiate		| `env = mamujoco_v1.parallel_env("ManySegmentSwimmer", ${Number Of Agents}x${Number Of Segments per Agent})`	|
+|-----------------------|------------------------------------------------------|
+| Agents		| `agents= ['agent_0', ..., 'agent_${Number Of Agents}']`					|
+| Number of Agents	| `${Number Of Agents}`						|
+| Action Spaces		| `{${agents} : Box(-1, 1, (${Number Of Segments per Agent},), float32)}`			|
+| Part partition	| `(joint0, joint1,)`	|
+
+The environment is partitioned in `${Number Of Agents}` parts, with each part corresponding to `${Number Of Segments per Agent}` joints.
+
+#### Agent 0 action space
+| Num | Action                             | Control Min | Control Max | Name (in corresponding XML file) | Joint | Unit         |
+|-----|------------------------------------|-------------|-------------|----------------------------------|-------|--------------|
+| 0   | Torque applied on the first rotor  | -1          | 1           | motor1_rot                       | hinge | torque (N m) |
+| 1   | Torque applied on the second rotor | -1          | 1           | motor2_rot                       | hinge | torque (N m) |
+| ... | ...                                | -1          | 1           | ...                              | hinge | torque (N m) |
+| `${Number Of Segments per Agent}` | Torque applied on the agent's last rotor | -1          | 1           | motor`${Number Of Segments per Agent}`_rot                       | hinge | torque (N m) |
+#### Agent 1 action space
+| Num | Action                             | Control Min | Control Max | Name (in corresponding XML file) | Joint | Unit         |
+|-----|------------------------------------|-------------|-------------|----------------------------------|-------|--------------|
+| 0   | Torque applied on the `${Number Of Segments per Agent}` rotor | -1          | 1           | ??? | hinge | torque (N m) |
+| ... | ...                                | -1          | 1           | ...                              | hinge | torque (N m) |
+| `${Number Of Segments per Agent}` | Torque applied on the agent's last rotor | -1          | 1           | motor`2x${Number Of Segments per Agent}`_rot                       | hinge | torque (N m) |
+#### Agent ... action space
+...
+
+
+
+## Observation Space
+| Observation Categories ||
+|-----------------------|------------------------------------------------------|			
+| Default `local_categories` | `[["qpos", "qvel"], ["qpos"]]` |
+| Default `global_categories` | `("qpos", "qvel")` |
+| Supported observation categories | `"qpos", "qvel"` |
+
+Besides the local observations of each agent (which depend on the agent's parts, the observation categories and the observation depth), each agent also observes the position and velocity items of the swimmer's tip.
+See more at the [Gymnasium's Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/#observation-space).
+
+
+
+## Rewards
+All agents receive the same [Gymnasium's Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/#rewards) reward.
+
+
+
+## Starting state
+The starting state of the environment is the same as [Gymnasium's Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/#starting-state).
+
+
+
+## Episode End
+All agents terminate and truncate at the same time, given the same conditions as [Gymnasium's Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/#episode-end).
+
+
+## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+	- Now uses the same `option.timestep` as `Gymnasium/Swimmer` (0.01).
+	- Updated model to work with `mujoco>=3.0.0`.
+* v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
+
diff --git a/docs/envs/MaMuJoCo/ma_pusher.md b/docs/envs/MaMuJoCo/ma_pusher.md
index d4f92f30..1c45a1f2 100644
--- a/docs/envs/MaMuJoCo/ma_pusher.md
+++ b/docs/envs/MaMuJoCo/ma_pusher.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Pusher](https://gymnasium.farama.org/environment
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/pusher.png
     :name: pusher
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Pusher", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Pusher", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -50,7 +50,7 @@ If partitioning, is None then the environment contains a single agent with the s
     :name: pusher_3p
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Pusher", "3p")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Pusher", "3p")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 3							|
@@ -98,7 +98,7 @@ All agents receive the same [Gymnasium's Pusher](https://gymnasium.farama.org/en
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Pusher](https://gymnasium.farama.org/environments/mujoco/pusher/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Pusher](https://gymnasium.farama.org/environments/mujoco/pusher/#starting-state).
 
 
 
@@ -107,4 +107,6 @@ All agent terminate and truncate at same time given the same conditions as [Gymn
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), first implemented here.
diff --git a/docs/envs/MaMuJoCo/ma_reacher.md b/docs/envs/MaMuJoCo/ma_reacher.md
index 0bd613d9..a587e1c8 100644
--- a/docs/envs/MaMuJoCo/ma_reacher.md
+++ b/docs/envs/MaMuJoCo/ma_reacher.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Reacher](https://gymnasium.farama.org/environmen
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/reacher.png
     :name: reacher
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Reacher", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Reacher", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -45,7 +45,7 @@ If partitioning, is `None`, then the environment contains a single agent with th
     :name: reacher_2x1
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Reacher", "2x1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Reacher", "2x1")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 2							|
@@ -84,7 +84,7 @@ All agents receive the same [Gymnasium's Reacher](https://gymnasium.farama.org/e
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Reacher](https://gymnasium.farama.org/environments/mujoco/reacher/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Reacher](https://gymnasium.farama.org/environments/mujoco/reacher/#starting-state).
 
 
 
@@ -93,6 +93,8 @@ All agent terminate and truncate at the same time, given the same conditions as
 
 
 ## Version History
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Added/Fixed Global observations (The Targets's coordinates: `targetx`, `targety`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_single.md b/docs/envs/MaMuJoCo/ma_single.md
index dab60914..599ce7d8 100644
--- a/docs/envs/MaMuJoCo/ma_single.md
+++ b/docs/envs/MaMuJoCo/ma_single.md
@@ -20,7 +20,7 @@ The Purpose of these is to allow researchers to debug multi-agent learning algor
 
 
 ## Action Space
-The action spaces is depended on the partitioning.
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ## Observation Space
 The agent receives the same observations as the single agent Gymnasium environment.
@@ -43,6 +43,8 @@ The agent terminates and truncates at the same time, given the same conditions a
 
 
 ## Version History
-v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of [the original multiagent_mujuco](https://github.com/schroederdewitt/multiagent_mujoco).
+* v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+* v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of [the original multiagent_mujuco](https://github.com/schroederdewitt/multiagent_mujoco).
 No Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)).
 
diff --git a/docs/envs/MaMuJoCo/ma_swimmer.md b/docs/envs/MaMuJoCo/ma_swimmer.md
index 97400b5c..0d066615 100644
--- a/docs/envs/MaMuJoCo/ma_swimmer.md
+++ b/docs/envs/MaMuJoCo/ma_swimmer.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Swimmer](https://gymnasium.farama.org/environmen
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/swimmer.png
     :name: swimmer
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Swimmer", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Swimmer", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -45,7 +45,7 @@ If partitioning, is `None` then the environment contains a single agent with the
     :name: swimmer_2x1
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Swimmer", "2x1")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Swimmer", "2x1")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 2							|
@@ -83,7 +83,7 @@ All agents receive the same [Gymnasium's Swimmer](https://gymnasium.farama.org/e
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Swimmer](https://gymnasium.farama.org/environments/mujoco/swimmer/#starting-state).
 
 
 
@@ -92,6 +92,8 @@ All agent terminate and truncate at the same time, given the same conditions as
 
 
 ## Version History
+- v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Added/Fixed Global observations (The Swimmer's front tip: `free_body_rot`) not being observed.
diff --git a/docs/envs/MaMuJoCo/ma_walker2d.md b/docs/envs/MaMuJoCo/ma_walker2d.md
index e273e5c3..cfa7ef03 100644
--- a/docs/envs/MaMuJoCo/ma_walker2d.md
+++ b/docs/envs/MaMuJoCo/ma_walker2d.md
@@ -17,14 +17,14 @@ The task is [Gymansium's MuJoCo/Walker2D](https://gymnasium.farama.org/environme
 
 
 ## Action Space
-The action spaces is depended on the partitioning
+The shape of the action space depends on the partitioning. The partitioning has the following form:
 
 ### if partitioning is None:
 ```{figure} figures/walker2d.png
     :name: walker2d
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Walker2D", None)`	|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Walker2D", None)`	|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0']`					|
 | Number of Agents	| 1							|
@@ -49,7 +49,7 @@ If partitioning, is `None` then the environment contains a single agent with the
     :name: walker2d_2x3
 ```
 
-| Instantiate		| `env = mamujoco_v0.parallel_env("Walker2d", "2x3")`|
+| Instantiate		| `env = mamujoco_v1.parallel_env("Walker2d", "2x3")`|
 |-----------------------|------------------------------------------------------|
 | Agents		| `agents= ['agent_0', 'agent_1']`			|
 | Number of Agents	| 2							|
@@ -92,7 +92,7 @@ All agents receive the same [Gymnasium's Walker2D](https://gymnasium.farama.org/
 
 
 ## Starting state
-The starting state of the environment is the as [Gymnasium's Walker2D](https://gymnasium.farama.org/environments/mujoco/walker2d/#starting-state).
+The starting state of the environment is the same as [Gymnasium's Walker2D](https://gymnasium.farama.org/environments/mujoco/walker2d/#starting-state).
 
 
 
@@ -102,6 +102,9 @@ All agent terminate and truncate at the same time given the same conditions as [
 
 
 ## Version History
+- v1:
+	- Now based on `Gymnasium/MuJoCo-v5` instead of `Gymnasium/MuJoCo-v4` (https://github.com/Farama-Foundation/Gymnasium/pull/572).
+	- Fixed bug: global nodes are now `[root_x, root_z, root_y]` (used to be `[root_x, root_x, root_z]`).
 - v0: Initial version release, uses [Gymnasium.MuJoCo-v4](https://gymnasium.farama.org/environments/mujoco/), and is a fork of the original MaMuJoCo [schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco).
 Changes from the original `MaMuJoCo` ([schroederdewitt/multiagent_mujoco](https://github.com/schroederdewitt/multiagent_mujoco)):
 	- Added/Fixed Global observations (The Walker's top: `rootx`, `rooty`, `rootz`) not being observed.
diff --git a/gymnasium_robotics/__init__.py b/gymnasium_robotics/__init__.py
index 1b1c37d4..49c86374 100644
--- a/gymnasium_robotics/__init__.py
+++ b/gymnasium_robotics/__init__.py
@@ -3,9 +3,9 @@
 
 from gymnasium_robotics.core import GoalEnv
 from gymnasium_robotics.envs.maze import maps
-from gymnasium_robotics.envs.multiagent_mujoco import mamujoco_v0
+from gymnasium_robotics.envs.multiagent_mujoco import mamujoco_v1
 
-__version__ = "1.2.4"
+__version__ = "1.3.0a1"
 
 
 def register_robotics_envs():
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/__init__.py b/gymnasium_robotics/envs/multiagent_mujoco/__init__.py
index cf745d64..07eb2b5d 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/__init__.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/__init__.py
@@ -3,12 +3,6 @@
 from gymnasium_robotics.envs.multiagent_mujoco.coupled_half_cheetah import (  # noqa: F401
     CoupledHalfCheetahEnv,
 )
-from gymnasium_robotics.envs.multiagent_mujoco.many_segment_ant import (  # noqa: F401
-    ManySegmentAntEnv,
-)
-from gymnasium_robotics.envs.multiagent_mujoco.many_segment_swimmer import (  # noqa: F401
-    ManySegmentSwimmerEnv,
-)
 from gymnasium_robotics.envs.multiagent_mujoco.mujoco_multi import (  # noqa: F401
     MultiAgentMujocoEnv,
 )
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_ant.xml.template b/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_ant.xml.template
index 3b6b4eb8..8bfc3308 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_ant.xml.template
+++ b/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_ant.xml.template
@@ -1,7 +1,13 @@
+<!--
+Template model for `ManySegmentAnt`, based on the work of de Witt
+modified by @kallinteris-andreas
+  - To not require `coordinate="global"`
+  - `option.timestep` set to `0.01` (same as `Gymnasium/Ant`).
+-->
 <mujoco model="ant">
   <size nconmax="200"/>
   <compiler angle="degree" coordinate="local" inertiafromgeom="true"/>
-  <option integrator="RK4" timestep="0.005"/>
+  <option integrator="RK4" timestep="0.01"/>
   <custom>
     <numeric data="0.0 0.0 0.55 1.0 0.0 0.0 0.0 0.0 1.0 0.0 -1.0 0.0 -1.0 0.0 1.0" name="init_qpos"/>
   </custom>
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_swimmer.xml.template b/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_swimmer.xml.template
index 9fb49a95..cff01a49 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_swimmer.xml.template
+++ b/gymnasium_robotics/envs/multiagent_mujoco/assets/many_segment_swimmer.xml.template
@@ -1,8 +1,14 @@
+<!--
+Template model for `ManySegmentSwimmer`, based on the work of de Witt
+modified by @kallinteris-andreas
+  - `option.timestep` set to `0.01` (same as `Gymnasium/Swimmer`).
+  - Updated to work with `mujoco>=3.0.0`
+-->
 <mujoco model="swimmer">
   <compiler angle="degree" coordinate="local" inertiafromgeom="true"/>
-  <option collision="predefined" density="4000" integrator="RK4" timestep="0.005" viscosity="0.1"/>
+  <option density="4000" integrator="RK4" timestep="0.01" viscosity="0.1"/>
   <default>
-    <geom conaffinity="1" condim="1" contype="1" material="geom" rgba="0.8 0.6 .4 1"/>
+    <geom conaffinity="0" condim="1" contype="0" material="geom" rgba="0.8 0.6 .4 1"/>
     <joint armature='0.1'  />
   </default>
   <asset>
@@ -14,9 +20,10 @@
   </asset>
   <worldbody>
     <light cutoff="100" diffuse="1 1 1" dir="-0 0 -1.3" directional="true" exponent="1" pos="0 0 1.3" specular=".1 .1 .1"/>
-    <geom conaffinity="1" condim="3" material="MatPlane" name="floor" pos="0 0 -0.1" rgba="0.8 0.9 0.8 1" size="40 40 0.1" type="plane"/>
+    <geom condim="3" material="MatPlane" name="floor" pos="0 0 -0.1" rgba="0.8 0.9 0.8 1" size="40 40 0.1" type="plane"/>
     <!--  ================= SWIMMER ================= /-->
     <body name="torso" pos="0 0 0">
+      <camera name="track" mode="trackcom" pos="0 -3 3" xyaxes="1 0 0 0 1 1"/>
       <geom density="1000" fromto="1.5 0 0 0.5 0 0" size="0.1" type="capsule"/>
       <joint axis="1 0 0" name="slider1" pos="0 0 0" type="slide"/>
       <joint axis="0 1 0" name="slider2" pos="0 0 0" type="slide"/>
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/coupled_half_cheetah.py b/gymnasium_robotics/envs/multiagent_mujoco/coupled_half_cheetah.py
index 07b27c25..c33eb70d 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/coupled_half_cheetah.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/coupled_half_cheetah.py
@@ -38,7 +38,7 @@ class CoupledHalfCheetahEnv(mujoco_env.MujocoEnv, EzPickle):
     | 0   | Torque applied on the back thigh rotor of the first cheetah   | -1          | 1           | bthigh0                          | hinge | torque (N m) |
     | 1   | Torque applied on the back shin rotor of the first cheetah    | -1          | 1           | bshin0                           | hinge | torque (N m) |
     | 2   | Torque applied on the back foot rotor of the first cheetah    | -1          | 1           | bfoot0                           | hinge | torque (N m) |
-    | 3   | Torque applied on the front thigh rotor of the first cheetah   | -1          | 1           | fthigh0                          | hinge | torque (N m) |
+    | 3   | Torque applied on the front thigh rotor of the first cheetah  | -1          | 1           | fthigh0                          | hinge | torque (N m) |
     | 4   | Torque applied on the front shin rotor of the first cheetah   | -1          | 1           | fshin0                           | hinge | torque (N m) |
     | 5   | Torque applied on the front foot rotor of the first cheetah   | -1          | 1           | ffoot0                           | hinge | torque (N m) |
     | 6   | Torque applied on the back thigh rotor of the second cheetah  | -1          | 1           | bthigh1                          | hinge | torque (N m) |
@@ -129,7 +129,7 @@ class CoupledHalfCheetahEnv(mujoco_env.MujocoEnv, EzPickle):
     No additional arguments are currently supported in pre-release.
 
     ## Version History
-    * pre_release: part of `Gymnasium-Robotics/mamujoco`
+    * pre_release: part of `Gymnasium-Robotics/MaMuJoCo`
     """
 
     metadata = {
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/mamujoco_v0.py b/gymnasium_robotics/envs/multiagent_mujoco/mamujoco_v1.py
similarity index 100%
rename from gymnasium_robotics/envs/multiagent_mujoco/mamujoco_v0.py
rename to gymnasium_robotics/envs/multiagent_mujoco/mamujoco_v1.py
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/many_segment_ant.py b/gymnasium_robotics/envs/multiagent_mujoco/many_segment_ant.py
index be394f35..39f9ab3c 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/many_segment_ant.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/many_segment_ant.py
@@ -5,196 +5,79 @@
 Original Author: Schroeder de Witt
 
  - General code cleanup, factorization, type hinting, adding documentation and comments
- - updated API to Gymnasium.MuJoCo v4
- - increase returned info
- - renamed ManyAgentAntEnv -> ManySegmentAntEnv (and changed the __init__ arguments accordingly)
+ - Removed the class (but kept the `gen_asset` function)
 """
 
 import os
-import typing
 
 import gymnasium
-import numpy as np
-from gymnasium.envs.mujoco import mujoco_env
-from gymnasium.utils.ezpickle import EzPickle
-from jinja2 import Template
 
-DEFAULT_CAMERA_CONFIG = {
-    "distance": 4.0,
-}
 
-
-class ManySegmentAntEnv(mujoco_env.MujocoEnv, EzPickle):
-    """Is a vartion of the Ant environment, but with ants coupled together (each segment has a torso + 4 legs).
+def gen_asset(n_segs: int, asset_path: str) -> None:
+    """Generates the MuJoCo XML asset file (written to `asset_path`) for a variation of the Ant environment, but with ants coupled together (each segment has a torso + 4 legs).
 
     This environment was first introduced ["FACMAC: Factored Multi-Agent Centralised Policy Gradients"](https://arxiv.org/abs/2003.06709).
     """
-
-    metadata = {
-        "render_modes": [
-            "human",
-            "rgb_array",
-            "depth_array",
-        ],
-        "render_fps": 50,
-    }
-
-    def __init__(self, n_segs: int, render_mode: typing.Optional[str] = None):
-        """Init.
-
-        Args:
-            n_segs: the number of segments of the ant (1 segment is the same as Gymansium's ant)
-            render_mode: see [Gymansium/MuJoCo](https://gymnasium.farama.org/environments/mujoco/)
-        """
-        self.healthy_reward = 1
-        self._ctrl_cost_weight = 0.5
-        self._contact_cost_weight = 5e-4
-        self._reset_noise_scale = 0.1
-
-        # Check whether asset file exists already, otherwise create it
-        asset_path = os.path.join(
-            os.path.dirname(os.path.abspath(__file__)),
-            "assets",
-            f"many_segment_ant_{n_segs}_segments.auto.xml",
+    try:
+        import jinja2
+    except ImportError as e:
+        raise gymnasium.error.DependencyNotInstalled(
+            f"{e}. "
+            "(hint: you need to install jinja, run `pip install gymnasium_robotics[mamujoco]`.)"
         )
-        self._generate_asset(n_segs=n_segs, asset_path=asset_path)
 
-        observation_space = gymnasium.spaces.Box(
-            low=-np.inf,
-            high=np.inf,
-            shape=(n_segs * 50 + 17,),
-            dtype=np.float64,
-        )
-        mujoco_env.MujocoEnv.__init__(
-            self,
-            asset_path,
-            4,
-            observation_space=observation_space,
-            default_camera_config=DEFAULT_CAMERA_CONFIG,
-            render_mode=render_mode,
-        )
-        EzPickle.__init__(self, n_segs=n_segs, render_mode=render_mode)
-        os.remove(asset_path)
-
-    def _generate_asset(self, n_segs: int, asset_path: str) -> None:
-        template_path = os.path.join(
-            os.path.dirname(os.path.abspath(__file__)),
-            "assets",
-            "many_segment_ant.xml.template",
-        )
-        with open(template_path) as file:
-            template = Template(file.read())
-        body_str_template = """
-        <body name="torso_{:d}" pos="-1 0 0">
-           <!--<joint axis="0 1 0" name="nnn_{:d}" pos="0.0 0.0 0.0" range="-1 1" type="hinge"/>-->
-            <geom density="100" fromto="1 0 0 0 0 0" size="0.1" type="capsule"/>
-            <body name="front_right_leg_{:d}" pos="0 0 0">
-              <geom fromto="0.0 0.0 0.0 0.0 0.2 0.0" name="aux1_geom_{:d}" size="0.08" type="capsule"/>
-              <body name="aux_2_{:d}" pos="0.0 0.2 0">
-                <joint axis="0 0 1" name="hip1_{:d}" pos="0.0 0.0 0.0" range="-30 30" type="hinge"/>
-                <geom fromto="0.0 0.0 0.0 -0.2 0.2 0.0" name="right_leg_geom_{:d}" size="0.08" type="capsule"/>
-                <body pos="-0.2 0.2 0">
-                  <joint axis="1 1 0" name="ankle1_{:d}" pos="0.0 0.0 0.0" range="-70 -30" type="hinge"/>
-                  <geom fromto="0.0 0.0 0.0 -0.4 0.4 0.0" name="right_ankle_geom_{:d}" size="0.08" type="capsule"/>
-                </body>
-              </body>
+    template_path = os.path.join(
+        os.path.dirname(os.path.abspath(__file__)),
+        "assets",
+        "many_segment_ant.xml.template",
+    )
+
+    with open(template_path) as file:
+        template = jinja2.Template(file.read())
+
+    body_str_template = """
+    <body name="torso_{:d}" pos="-1 0 0">
+       <!--<joint axis="0 1 0" name="nnn_{:d}" pos="0.0 0.0 0.0" range="-1 1" type="hinge"/>-->
+        <geom density="100" fromto="1 0 0 0 0 0" size="0.1" type="capsule"/>
+        <body name="front_right_leg_{:d}" pos="0 0 0">
+          <geom fromto="0.0 0.0 0.0 0.0 0.2 0.0" name="aux1_geom_{:d}" size="0.08" type="capsule"/>
+          <body name="aux_2_{:d}" pos="0.0 0.2 0">
+            <joint axis="0 0 1" name="hip1_{:d}" pos="0.0 0.0 0.0" range="-30 30" type="hinge"/>
+            <geom fromto="0.0 0.0 0.0 -0.2 0.2 0.0" name="right_leg_geom_{:d}" size="0.08" type="capsule"/>
+            <body pos="-0.2 0.2 0">
+              <joint axis="1 1 0" name="ankle1_{:d}" pos="0.0 0.0 0.0" range="-70 -30" type="hinge"/>
+              <geom fromto="0.0 0.0 0.0 -0.4 0.4 0.0" name="right_ankle_geom_{:d}" size="0.08" type="capsule"/>
             </body>
-            <body name="back_leg_{:d}" pos="0 0 0">
-              <geom fromto="0.0 0.0 0.0 0.0 -0.2 0.0" name="aux2_geom_{:d}" size="0.08" type="capsule"/>
-              <body name="aux2_{:d}" pos="0.0 -0.2 0">
-                <joint axis="0 0 1" name="hip2_{:d}" pos="0.0 0.0 0.0" range="-30 30" type="hinge"/>
-                <geom fromto="0.0 0.0 0.0 -0.2 -0.2 0.0" name="back_leg_geom_{:d}" size="0.08" type="capsule"/>
-                <body pos="-0.2 -0.2 0">
-                  <joint axis="-1 1 0" name="ankle2_{:d}" pos="0.0 0.0 0.0" range="-70 -30" type="hinge"/>
-                  <geom fromto="0.0 0.0 0.0 -0.4 -0.4 0.0" name="third_ankle_geom_{:d}" size="0.08" type="capsule"/>
-                </body>
-              </body>
+          </body>
+        </body>
+        <body name="back_leg_{:d}" pos="0 0 0">
+          <geom fromto="0.0 0.0 0.0 0.0 -0.2 0.0" name="aux2_geom_{:d}" size="0.08" type="capsule"/>
+          <body name="aux2_{:d}" pos="0.0 -0.2 0">
+            <joint axis="0 0 1" name="hip2_{:d}" pos="0.0 0.0 0.0" range="-30 30" type="hinge"/>
+            <geom fromto="0.0 0.0 0.0 -0.2 -0.2 0.0" name="back_leg_geom_{:d}" size="0.08" type="capsule"/>
+            <body pos="-0.2 -0.2 0">
+              <joint axis="-1 1 0" name="ankle2_{:d}" pos="0.0 0.0 0.0" range="-70 -30" type="hinge"/>
+              <geom fromto="0.0 0.0 0.0 -0.4 -0.4 0.0" name="third_ankle_geom_{:d}" size="0.08" type="capsule"/>
             </body>
-        """
-
-        body_close_str_template = "</body>\n"
-        actuator_str_template = """\t     <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="hip1_{:d}" gear="150"/>
-                                          <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="ankle1_{:d}" gear="150"/>
-                                          <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="hip2_{:d}" gear="150"/>
-                                          <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="ankle2_{:d}" gear="150"/>\n"""
-
-        body_str = ""
-        for i in range(1, n_segs):
-            body_str += body_str_template.format(*([i] * 16))
-        body_str += body_close_str_template * (n_segs - 1)
-
-        actuator_str = ""
-        for i in range(n_segs):
-            actuator_str += actuator_str_template.format(*([i] * 8))
-
-        rt = template.render(body=body_str, actuators=actuator_str)
-        with open(asset_path, "w") as file:
-            file.write(rt)
-
-    def step(self, action: np.ndarray):
-        """Performs a single step given the `action`.
-
-        Reward has same structure as ant
-        Does terminate when the front torso is unhealthy (in the same way as the ant)
-        """
-        x_position_before = self.get_body_com("torso_0")[0]
-        self.do_simulation(action, self.frame_skip)
-        x_position_after = self.get_body_com("torso_0")[0]
-
-        x_velocity = (x_position_after - x_position_before) / self.dt
-
-        forward_reward = x_velocity
-        healthy_reward = self.healthy_reward
-
-        ctrl_cost = self._ctrl_cost_weight * np.square(action).sum()
-        contact_cost = self._contact_cost_weight * np.sum(
-            np.square(np.clip(self.data.cfrc_ext, -1, 1))
-        )
-        contact_cost = 0  # In Gymnasium.MuJoCo-v4 contanct costs are ignored
-
-        state = self.state_vector()
-        notdone = np.isfinite(state).all() and state[2] >= 0.2 and state[2] <= 1.0
-
-        observation = self._get_obs()
-        reward = forward_reward - ctrl_cost - contact_cost + healthy_reward
-        terminated = not notdone
-        truncated = False
+          </body>
+        </body>
+    """
 
-        info = {
-            "reward_forward": forward_reward,
-            "reward_ctrl": -ctrl_cost,
-            "reward_survive": healthy_reward,
-            "x_position": x_position_after,
-            # "y_position": xy_position_after[1],
-            # "distance_from_origin": np.linalg.norm(xy_position_after, ord=2),
-            "x_velocity": x_velocity,
-            # "y_velocity": y_velocity,
-            "forward_reward": forward_reward,
-        }
+    body_close_str_template = "</body>\n"
+    actuator_str_template = """\t     <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="hip1_{:d}" gear="150"/>
+                                      <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="ankle1_{:d}" gear="150"/>
+                                      <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="hip2_{:d}" gear="150"/>
+                                      <motor ctrllimited="true" ctrlrange="-1.0 1.0" joint="ankle2_{:d}" gear="150"/>\n"""
 
-        if self.render_mode == "human":
-            self.render()
-        return (observation, reward, terminated, truncated, info)
+    body_str = ""
+    for i in range(1, n_segs):
+        body_str += body_str_template.format(*([i] * 16))
+    body_str += body_close_str_template * (n_segs - 1)
 
-    def _get_obs(self) -> np.ndarray:
-        return np.concatenate(
-            [
-                self.data.qpos.flat[2:],
-                self.data.qvel.flat,
-                np.clip(self.data.cfrc_ext, -1, 1).flat,
-            ]
-        )
+    actuator_str = ""
+    for i in range(n_segs):
+        actuator_str += actuator_str_template.format(*([i] * 8))
 
-    def reset_model(self) -> np.ndarray:
-        """Resets the model in same way as the Swimmer."""
-        qpos = self.init_qpos + self.np_random.uniform(
-            size=self.model.nq,
-            low=-self._reset_noise_scale,
-            high=self._reset_noise_scale,
-        )
-        qvel = (
-            self.init_qvel
-            + self.np_random.standard_normal(self.model.nv) * self._reset_noise_scale
-        )
-        self.set_state(qpos, qvel)
-        return self._get_obs()
+    rt = template.render(body=body_str, actuators=actuator_str)
+    with open(asset_path, "w") as file:
+        file.write(rt)
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/many_segment_swimmer.py b/gymnasium_robotics/envs/multiagent_mujoco/many_segment_swimmer.py
index b435d166..88475815 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/many_segment_swimmer.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/many_segment_swimmer.py
@@ -5,166 +5,63 @@
 Original Author: Schroeder de Witt
 
  - General code cleanup, factorization, type hinting, adding documentation and comments
- - updated API to Gymnasium.MuJoCo v4
- - increase returned info
- - renamed ManyAgentSwimmerEnv -> ManySegmentSwimmerEnv (and changed the __init__ arguments accordingly)
+ - Removed the class (but kept the `gen_asset` function)
 """
 
 
 import os
-import typing
 
 import gymnasium
-import numpy as np
-from gymnasium.envs.mujoco import mujoco_env
-from gymnasium.utils.ezpickle import EzPickle
-from jinja2 import Template
 
-DEFAULT_CAMERA_CONFIG = {
-    "distance": 4.0,
-}
 
-
-class ManySegmentSwimmerEnv(mujoco_env.MujocoEnv, EzPickle):
-    """Is a vartion of the Swimmer environment, but with many segments.
+def gen_asset(n_segs: int, asset_path: str) -> None:
+    """Generates the MuJoCo XML asset file (written to `asset_path`) for a variation of the Swimmer environment, but with many segments.
 
     This environment was first introduced ["FACMAC: Factored Multi-Agent Centralised Policy Gradients"](https://arxiv.org/abs/2003.06709).
     """
-
-    metadata = {
-        "render_modes": [
-            "human",
-            "rgb_array",
-            "depth_array",
-        ],
-        "render_fps": 50,
-    }
-
-    def __init__(self, n_segs: int, render_mode: typing.Optional[str] = None):
-        """Init.
-
-        Args:
-            n_segs: the number of segments of the swimmer (3 segments is the same as Gymansium's swimmer)
-            render_mode: see [Gymansium/MuJoCo](https://gymnasium.farama.org/environments/mujoco/)
-        """
-        self._forward_reward_weight = 1.0
-        self._ctrl_cost_weight = 1e-4
-        self._reset_noise_scale = 0.1
-
-        # Check whether asset file exists already, otherwise create it
-        asset_path = os.path.join(
-            os.path.dirname(os.path.abspath(__file__)),
-            "assets",
-            f"many_segment_swimmer_{n_segs}_segments.auto.xml",
+    try:
+        import jinja2
+    except ImportError as e:
+        raise gymnasium.error.DependencyNotInstalled(
+            f"{e}. "
+            "(hint: you need to install jinja, run `pip install gymnasium_robotics[mamujoco]`.)"
         )
-        self._generate_asset(n_segs=n_segs, asset_path=asset_path)
 
-        observation_space = gymnasium.spaces.Box(
-            low=-np.inf, high=np.inf, shape=(n_segs * 2 + 4,), dtype=np.float64
-        )
-        mujoco_env.MujocoEnv.__init__(
-            self,
-            asset_path,
-            4,
-            observation_space=observation_space,
-            default_camera_config=DEFAULT_CAMERA_CONFIG,
-            render_mode=render_mode,
-        )
-        EzPickle.__init__(self, n_segs=n_segs, render_mode=render_mode)
-        os.remove(asset_path)
-
-    def _generate_asset(self, n_segs: int, asset_path: str) -> None:
-        template_path = os.path.join(
-            os.path.dirname(os.path.abspath(__file__)),
-            "assets",
-            "many_segment_swimmer.xml.template",
-        )
-        with open(template_path) as file:
-            template = Template(file.read())
-        body_str_template = """
-        <body name="mid{:d}" pos="-1 0 0">
-          <geom density="1000" fromto="0 0 0 -1 0 0" size="0.1" type="capsule"/>
-          <joint axis="0 0 {:d}" limited="true" name="rot{:d}" pos="0 0 0" range="-100 100" type="hinge"/>
-        """
-
-        body_end_str_template = """
-        <body name="back" pos="-1 0 0">
-            <geom density="1000" fromto="0 0 0 -1 0 0" size="0.1" type="capsule"/>
-            <joint axis="0 0 1" limited="true" name="rot{:d}" pos="0 0 0" range="-100 100" type="hinge"/>
-          </body>
-        """
-
-        body_close_str_template = "</body>\n"
-        actuator_str_template = """\t <motor ctrllimited="true" ctrlrange="-1 1" gear="150.0" joint="rot{:d}"/>\n"""
-
-        body_str = ""
-        for i in range(1, n_segs - 1):
-            body_str += body_str_template.format(i, (-1) ** (i + 1), i)
-        body_str += body_end_str_template.format(n_segs - 1)
-        body_str += body_close_str_template * (n_segs - 2)
-
-        actuator_str = ""
-        for i in range(n_segs):
-            actuator_str += actuator_str_template.format(i)
-
-        rt = template.render(body=body_str, actuators=actuator_str)
-        with open(asset_path, "w") as file:
-            file.write(rt)
-
-    def step(self, action: np.ndarray):
-        """Performs a single step given the `action`.
-
-        Reward has same structure as Swimmer
-        Does never terminate (like Swimmer)
-        """
-        x_position_before = self.data.qpos[0]
-        self.do_simulation(action, self.frame_skip)
-        x_position_after = self.data.qpos[0]
-
-        x_velocity = (x_position_after - x_position_before) / self.dt
-
-        forward_reward = self._forward_reward_weight * x_velocity
-
-        ctrl_cost = self._ctrl_cost_weight * np.square(action).sum()
-
-        observation = self._get_obs()
-        reward = forward_reward - ctrl_cost
-        terminal = False
-        truncated = False
-        info = {
-            "reward_fwd": forward_reward,
-            "reward_ctrl": -ctrl_cost,
-            "x_position": x_position_after,
-            # "y_position": xy_position_after[1],
-            # "distance_from_origin": np.linalg.norm(xy_position_after, ord=2),
-            "x_velocity": x_velocity,
-            # "y_velocity": y_velocity,
-            "forward_reward": forward_reward,
-        }
-
-        if self.render_mode == "human":
-            self.render()
-        return observation, reward, terminal, truncated, info
-
-    def _get_obs(self) -> np.ndarray:
-        qpos = self.data.qpos
-        qvel = self.data.qvel
-        return np.concatenate([qpos.flat[2:], qvel.flat])
-
-    def reset_model(self) -> np.ndarray:
-        """Resets the model in same way as the Swimmer."""
-        self.set_state(
-            self.init_qpos
-            + self.np_random.uniform(
-                low=-self._reset_noise_scale,
-                high=self._reset_noise_scale,
-                size=self.model.nq,
-            ),
-            self.init_qvel
-            + self.np_random.uniform(
-                low=-self._reset_noise_scale,
-                high=self._reset_noise_scale,
-                size=self.model.nv,
-            ),
-        )
-        return self._get_obs()
+    template_path = os.path.join(
+        os.path.dirname(os.path.abspath(__file__)),
+        "assets",
+        "many_segment_swimmer.xml.template",
+    )
+
+    with open(template_path) as file:
+        template = jinja2.Template(file.read())
+
+    body_str_template = """
+    <body name="mid{:d}" pos="-1 0 0">
+      <geom density="1000" fromto="0 0 0 -1 0 0" size="0.1" type="capsule"/>
+      <joint axis="0 0 {:d}" limited="true" name="rot{:d}" pos="0 0 0" range="-100 100" type="hinge"/>
+    """
+
+    body_end_str_template = """
+    <body name="back" pos="-1 0 0">
+        <geom density="1000" fromto="0 0 0 -1 0 0" size="0.1" type="capsule"/>
+        <joint axis="0 0 1" limited="true" name="rot{:d}" pos="0 0 0" range="-100 100" type="hinge"/>
+      </body>
+    """
+
+    body_close_str_template = "</body>\n"
+    actuator_str_template = """\t <motor ctrllimited="true" ctrlrange="-1 1" gear="150.0" joint="rot{:d}"/>\n"""
+
+    body_str = ""
+    for i in range(1, n_segs - 1):
+        body_str += body_str_template.format(i, (-1) ** (i + 1), i)
+    body_str += body_end_str_template.format(n_segs - 1)
+    body_str += body_close_str_template * (n_segs - 2)
+
+    actuator_str = ""
+    for i in range(n_segs):
+        actuator_str += actuator_str_template.format(i)
+
+    rt = template.render(body=body_str, actuators=actuator_str)
+    with open(asset_path, "w") as file:
+        file.write(rt)
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py b/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py
index 0d671d16..8ea964db 100755
--- a/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/mujoco_multi.py
@@ -9,7 +9,8 @@
  - General code cleanup, factorization, type hinting, adding documentation and comments
  - Now uses PettingZoo APIs instead of a propriatery API
  - Now supports custom factorizations
- - Added new functions MultiAgentMujocoEnv.map_global_action_to_local_actions, MultiAgentMujocoEnv.map_local_actions_to_global_action, MultiAgentMujocoEnv.map_local_observation_to_global_state, MultiAgentMujocoEnv.map_local_observation_to_global_state
+ - Added new functions MultiAgentMujocoEnv.map_global_action_to_local_actions, MultiAgentMujocoEnv.map_local_actions_to_global_action, MultiAgentMujocoEnv.map_global_state_to_local_observations, MultiAgentMujocoEnv.map_local_observations_to_global_state
+ - Added `gym_env` argument, which can be used to load third-party `Gymnasium.MujocoEnv` environments.
 
 This project is covered by the Apache 2.0 License.
 """
@@ -17,42 +18,41 @@
 
 from __future__ import annotations
 
+import os
+
 import gymnasium
 import numpy as np
 import pettingzoo
 from gymnasium.wrappers import TimeLimit
 
+import gymnasium_robotics.envs.multiagent_mujoco.many_segment_ant as many_segment_ant
+import gymnasium_robotics.envs.multiagent_mujoco.many_segment_swimmer as many_segment_swimmer
 from gymnasium_robotics.envs.multiagent_mujoco.coupled_half_cheetah import (
     CoupledHalfCheetahEnv,
 )
-from gymnasium_robotics.envs.multiagent_mujoco.many_segment_ant import ManySegmentAntEnv
-from gymnasium_robotics.envs.multiagent_mujoco.many_segment_swimmer import (
-    ManySegmentSwimmerEnv,
-)
 from gymnasium_robotics.envs.multiagent_mujoco.obsk import (
     Node,
-    _observation_structure,
     build_obs,
     get_joints_at_kdist,
     get_parts_and_edges,
 )
 
-# TODO for future revisions v1?
+# TODO for future revisions v2?
 # color the renderer
 # support other Gymnasium-Robotics MuJoCo environments
 
 _MUJOCO_GYM_ENVIROMENTS = [
-    "Ant-v4",
-    "HalfCheetah-v4",
-    "Hopper-v4",
-    "HumanoidStandup-v4",
-    "Humanoid-v4",
-    "Reacher-v4",
-    "Swimmer-v4",
-    "Pusher-v4",
-    "Walker2d-v4",
-    "InvertedPendulum-v4",
-    "InvertedDoublePendulum-v4",
+    "Ant",
+    "HalfCheetah",
+    "Hopper",
+    "HumanoidStandup",
+    "Humanoid",
+    "Reacher",
+    "Swimmer",
+    "Pusher",
+    "Walker2d",
+    "InvertedPendulum",
+    "InvertedDoublePendulum",
 ]
 
 
@@ -75,10 +75,11 @@ def __init__(
         scenario: str,
         agent_conf: str | None,
         agent_obsk: int | None = 1,
-        agent_factorization: dict | None = None,
+        agent_factorization: dict[str, any] | None = None,
         local_categories: list[list[str]] | None = None,
         global_categories: tuple[str, ...] | None = None,
         render_mode: str | None = None,
+        gym_env: gymnasium.envs.mujoco.mujoco_env.MujocoEnv | None = None,
         **kwargs,
     ):
         """Init.
@@ -86,7 +87,8 @@ def __init__(
         Args:
             scenario: The Task/Environment, valid values:
                 "Ant", "HalfCheetah", "Hopper", "HumanoidStandup", "Humanoid", "Reacher", "Swimmer", "Pusher", "Walker2d", "InvertedPendulum", "InvertedDoublePendulum", "ManySegmentSwimmer", "ManySegmentAnt", "CoupledHalfCheetah"
-            agent_conf: '${Number Of Agents}x${Number Of Segments per Agent}${Optionally Additional options}', eg '1x6', '2x4', '2x4d',
+            agent_conf: Typical values:
+                '${Number Of Agents}x${Number Of Segments per Agent}${Optionally Additional options}', eg '1x6', '2x4', '2x4d',
                 If it set to None the task becomes single agent (the agent observes the entire environment, and performs all the actions)
             agent_obsk: Number of nearest joints to observe,
                 If set to 0 it only observes local state,
@@ -102,47 +104,22 @@ def __init__(
                 The default is: Check each environment's page on the "observation space" section.
             global_categories: The categories of observations extracted from the global observable space,
                 For example: if it is set to `("qpos")` out of the globally observable items of the environment, only the position items will be observed.
-                The default is: Check each environment's page on the "observation space" section.
-            render_mode: see [Gymansium/MuJoCo](https://gymnasium.farama.org/environments/mujoco/),
+                The default is: `("qpos", "qvel")`
+            render_mode: See [Gymnasium/MuJoCo](https://gymnasium.farama.org/environments/mujoco/),
                 valid values: 'human', 'rgb_array', 'depth_array'
+            gym_env: A custom `MujocoEnv` environment, overrides generation of environment by `MaMuJoCo`.
             kwargs: Additional arguments passed to the [Gymansium/MuJoCo](https://gymnasium.farama.org/environments/mujoco/) environment,
                 Note: arguments that change the observation space will not work.
 
-            Raises: NotImplementedError: When the scenario is not supported (not part of of the valid values)
+            Raises: NotImplementedError: When the scenario is not supported (not part of the valid values).
         """
-        scenario += "-v4"
-
-        # load the underlying single agent Gymansium MuJoCo Environment in `self.single_agent_env`
-        if scenario in _MUJOCO_GYM_ENVIROMENTS:
-            self.single_agent_env: gymnasium.envs.mujoco.mujoco_env.MujocoEnv = (
-                gymnasium.make(scenario, **kwargs, render_mode=render_mode)
-            )
-        elif scenario in ["ManySegmentAnt-v4"]:
-            assert isinstance(agent_conf, str)
-            try:
-                n_segs = int(agent_conf.split("x")[0]) * int(agent_conf.split("x")[1])
-            except Exception:
-                raise Exception(f"UNKNOWN partitioning config: {agent_conf}")
-
-            self.single_agent_env = TimeLimit(
-                ManySegmentAntEnv(n_segs, render_mode), max_episode_steps=1000
-            )
-        elif scenario in ["ManySegmentSwimmer-v4"]:
-            assert isinstance(agent_conf, str)
-            try:
-                n_segs = int(agent_conf.split("x")[0]) * int(agent_conf.split("x")[1])
-            except Exception:
-                raise Exception(f"UNKNOWN partitioning config: {agent_conf}")
-
-            self.single_agent_env = TimeLimit(
-                ManySegmentSwimmerEnv(n_segs, render_mode), max_episode_steps=1000
-            )
-        elif scenario in ["CoupledHalfCheetah-v4"]:
-            self.single_agent_env = TimeLimit(
-                CoupledHalfCheetahEnv(render_mode), max_episode_steps=1000
+        # Create underlying single agent environment
+        if gym_env is None:
+            self.single_agent_env = self._create_base_gym_env(
+                scenario, agent_conf, render_mode, **kwargs
             )
         else:
-            raise NotImplementedError("Custom env not implemented!")
+            self.single_agent_env = gym_env
 
         if agent_conf is None:
             self.agent_obsk = None
@@ -162,11 +139,9 @@ def __init__(
                 mujoco_edges = agent_factorization["edges"]
                 self.mujoco_globals = agent_factorization["globals"]
         else:
-            assert self.single_agent_env.action_space.shape is not None
-            dummy_node = Node("dummy_node", None, None, None)
             self.agent_action_partitions = [
                 tuple(
-                    dummy_node
+                    Node("dummy_node", None, None, i)
                     for i in range(self.single_agent_env.action_space.shape[0])
                 )
             ]
@@ -179,13 +154,13 @@ def __init__(
         ]
         self.agents = self.possible_agents
 
-        # load the observation categories
+        # load the observation categories (from init arguments or generate them)
         if local_categories is None:
-            self.k_categories = self._generate_local_categories(scenario)
+            self.local_categories = self._generate_local_categories(scenario)
         else:
-            self.k_categories = local_categories
+            self.local_categories = local_categories
         if global_categories is None:
-            self.global_categories = self._generate_global_categories(scenario)
+            self.global_categories = ("qpos", "qvel")
         else:
             self.global_categories = global_categories
 
@@ -200,6 +175,8 @@ def __init__(
                 for agent_id in range(self.num_agents)
             ]
 
+        self.observation_factorization = self.create_observation_mapping()
+
         # Create observation and action spaces
         self.observation_spaces, self.action_spaces = {}, {}
         for agent_id, partition in enumerate(self.agent_action_partitions):
@@ -218,6 +195,53 @@ def __init__(
                 dtype=self.single_agent_env.observation_space.dtype,
             )
 
+    def _create_base_gym_env(
+        self, scenario: str, agent_conf: str, render_mode: str, **kwargs
+    ) -> gymnasium.envs.mujoco.mujoco_env.MujocoEnv:
+        """Creates and returns the single agent environment that is to be factorized."""
+        # build the underlying single agent Gymnasium MuJoCo environment (the caller stores it in `self.single_agent_env`)
+        if scenario in _MUJOCO_GYM_ENVIROMENTS:
+            return gymnasium.make(f"{scenario}-v5", **kwargs, render_mode=render_mode)
+        elif scenario in ["ManySegmentAnt"]:
+            try:
+                n_segs = int(agent_conf.split("x")[0]) * int(agent_conf.split("x")[1])
+            except Exception:
+                raise Exception(f"UNKNOWN partitioning config: {agent_conf}")
+
+            asset_path = os.path.join(
+                os.path.dirname(os.path.abspath(__file__)),
+                "assets",
+                f"many_segment_ant_{n_segs}_segments.auto.xml",
+            )
+            many_segment_ant.gen_asset(n_segs=n_segs, asset_path=asset_path)
+            single_agent_env = gymnasium.make(
+                "Ant-v5", xml_file=asset_path, **kwargs, render_mode=render_mode
+            )
+            os.remove(asset_path)
+            return single_agent_env
+        elif scenario in ["ManySegmentSwimmer"]:
+            try:
+                n_segs = int(agent_conf.split("x")[0]) * int(agent_conf.split("x")[1])
+            except Exception:
+                raise Exception(f"UNKNOWN partitioning config: {agent_conf}")
+
+            asset_path = os.path.join(
+                os.path.dirname(os.path.abspath(__file__)),
+                "assets",
+                f"many_segment_swimmer_{n_segs}_segments.auto.xml",
+            )
+            many_segment_swimmer.gen_asset(n_segs=n_segs, asset_path=asset_path)
+            single_agent_env = gymnasium.make(
+                "Swimmer-v5", xml_file=asset_path, **kwargs, render_mode=render_mode
+            )
+            os.remove(asset_path)
+            return single_agent_env
+        elif scenario in ["CoupledHalfCheetah"]:
+            return TimeLimit(CoupledHalfCheetahEnv(render_mode), max_episode_steps=1000)
+        else:
+            # unsupported scenario: fail immediately (no debugger trap); custom envs go through `gym_env` in `__init__`
+            raise NotImplementedError("Custom env not implemented!")
+
     def step(
         self, actions: dict[str, np.ndarray]
     ) -> tuple[
@@ -322,8 +346,8 @@ def map_global_action_to_local_actions(
         return local_actions
 
     def map_global_state_to_local_observations(
-        self, global_state: np.ndarray
-    ) -> dict[str, np.ndarray]:
+        self, global_state: np.ndarray[np.float64]
+    ) -> dict[str, np.ndarray[np.float64]]:
         """Maps single agent observation into multi agent observation spaces.
 
         Args:
@@ -333,8 +357,74 @@ def map_global_state_to_local_observations(
         Returns:
             A dictionary of states that would be observed by each agent given the 'global_state'
         """
+        assert (
+            self.observation_factorization is not None
+        ), "to map states the MuJoCo environment must have `observation_structure` member variable"
+        global_state = np.array(global_state)
+
+        local_observation = {}
+        for agent, partition in self.observation_factorization.items():
+            local_observation[agent] = global_state[partition]
+
+        # assert sizes
+        assert len(local_observation) == len(self.action_spaces)
+        for agent in self.possible_agents:
+            assert (
+                len(local_observation[agent]) == self.observation_spaces[agent].shape[0]
+            )
+
+        return local_observation
+
+    def map_local_observations_to_global_state(
+        self, local_observation: dict[str, np.ndarray[np.float64]]
+    ) -> np.ndarray[np.float64]:
+        """Maps multi agent observations into single agent observation space.
+
+        Args:
+            local_observation:
+                the local observations of each agent, keyed by agent name (generated from MaMuJoCo.step())
+
+        Returns:
+            the global observations that correspond to a single agent (what you would get with MaMuJoCo.state())
+        """
+        assert (
+            self.observation_factorization is not None
+        ), "to map states the MuJoCo environment must have `observation_structure` member variable"
+
+        global_observation = (
+            np.zeros((self.single_agent_env.observation_space.shape[0],)) + np.nan
+        )
+
+        for agent, partition in self.observation_factorization.items():
+            for local_idx, global_idx in enumerate(partition):
+                assert (
+                    np.isnan(global_observation[global_idx])
+                    or global_observation[global_idx]
+                    == local_observation[agent][local_idx]
+                ), "FATAL: At least one gym_env observation is doubly defined!"
+                global_observation[global_idx] = local_observation[agent][local_idx]
+
+        assert not np.isnan(
+            global_observation
+        ).any(), "FATAL: At least one gym_env observation is undefined, observations can not be mapped."
+        return global_observation
+
+    def create_observation_mapping(self) -> dict[str, np.ndarray[np.float64]]:
+        """Creates a cache of the observation factorization.
+
+        The cache is intended to be used with `map_global_state_to_local_observations` & `map_local_observations_to_global_state`.
+
+        Returns:
+            A cache that indexes global observations to local.
+        """
         if self.agent_obsk is None:
-            return {self.possible_agents[0]: global_state}
+            return {
+                self.possible_agents[0]: np.arange(
+                    self.single_agent_env.observation_space.shape[0]
+                )
+            }
+        if not hasattr(self.single_agent_env.unwrapped, "observation_structure"):
+            return None
 
         class data_struct:
             def __init__(self, qpos, qvel, cinert, cvel, qfrc_actuator, cfrc_ext):
@@ -345,43 +435,63 @@ def __init__(self, qpos, qvel, cinert, cvel, qfrc_actuator, cfrc_ext):
                 self.qfrc_actuator = qfrc_actuator
                 self.cfrc_ext = cfrc_ext
 
-        obs_struct = _observation_structure(self.single_agent_env.spec.id)
+        obs_struct = self.single_agent_env.unwrapped.observation_structure
         qpos_end_index = obs_struct["qpos"]
         qvel_end_index = qpos_end_index + obs_struct["qvel"]
-        cinert_end_index = qvel_end_index + obs_struct["cinert"]
-        cvel_end_index = cinert_end_index + obs_struct["cvel"]
-        qfrc_actuator_end_index = cvel_end_index + obs_struct["qfrc_actuator"]
-        cfrc_ext_end_index = qfrc_actuator_end_index + obs_struct["cfrc_ext"]
+        cinert_end_index = qvel_end_index + obs_struct.get("cinert", 0)
+        cvel_end_index = cinert_end_index + obs_struct.get("cvel", 0)
+        qfrc_actuator_end_index = cvel_end_index + obs_struct.get("qfrc_actuator", 0)
+        cfrc_ext_end_index = qfrc_actuator_end_index + obs_struct.get("cfrc_ext", 0)
 
-        assert len(global_state) == cfrc_ext_end_index
+        global_index = np.arange(self.single_agent_env.observation_space.shape[0])
+        assert len(global_index) == cfrc_ext_end_index, "wrong indexing"
 
         mujoco_data = data_struct(
             qpos=np.concatenate(
-                (
-                    np.zeros(obs_struct["skipped_qpos"]),
-                    global_state[0:qpos_end_index],
-                )
+                [
+                    np.zeros(obs_struct["skipped_qpos"], dtype=np.int64),
+                    global_index[0:qpos_end_index],
+                ]
+            ),
+            qvel=np.array(global_index[qpos_end_index:qvel_end_index]),
+            cinert=np.concatenate(
+                [
+                    np.zeros(10, dtype=np.int64),
+                    global_index[qvel_end_index:cinert_end_index],
+                ]
             ),
-            qvel=np.array(global_state[qpos_end_index:qvel_end_index]),
-            cinert=np.array(global_state[qvel_end_index:cinert_end_index]),
-            cvel=np.array(global_state[cinert_end_index:cvel_end_index]),
-            qfrc_actuator=np.array(
-                global_state[cvel_end_index:qfrc_actuator_end_index]
+            cvel=np.concatenate(
+                [
+                    np.zeros(6, dtype=np.int64),
+                    global_index[cinert_end_index:cvel_end_index],
+                ]
+            ),
+            qfrc_actuator=np.concatenate(
+                [
+                    np.zeros(6, dtype=np.int64),
+                    global_index[cvel_end_index:qfrc_actuator_end_index],
+                ]
+            ),
+            cfrc_ext=np.concatenate(
+                [
+                    np.zeros(6, dtype=np.int64),
+                    global_index[qfrc_actuator_end_index:cfrc_ext_end_index],
+                ]
             ),
-            cfrc_ext=np.array(global_state[qfrc_actuator_end_index:cfrc_ext_end_index]),
         )
 
-        if len(mujoco_data.cinert) != 0:
+        if len(mujoco_data.cinert) > 10:
             mujoco_data.cinert = np.reshape(
-                mujoco_data.cinert, self.single_agent_env.data.cinert.shape
+                mujoco_data.cinert, self.single_agent_env.unwrapped.data.cinert.shape
             )
-        if len(mujoco_data.cvel) != 0:
+        if len(mujoco_data.cvel) > 6:
             mujoco_data.cvel = np.reshape(
-                mujoco_data.cvel, self.single_agent_env.data.cvel.shape
+                mujoco_data.cvel, self.single_agent_env.unwrapped.data.cvel.shape
             )
-        if len(mujoco_data.cfrc_ext) != 0:
+        if len(mujoco_data.cfrc_ext) > 6:
             mujoco_data.cfrc_ext = np.reshape(
-                mujoco_data.cfrc_ext, self.single_agent_env.data.cfrc_ext.shape
+                mujoco_data.cfrc_ext,
+                self.single_agent_env.unwrapped.data.cfrc_ext.shape,
             )
 
         assert len(self.single_agent_env.unwrapped.data.qpos.flat) == len(
@@ -391,28 +501,10 @@ def __init__(self, qpos, qvel, cinert, cvel, qfrc_actuator, cfrc_ext):
             mujoco_data.qvel
         )
 
-        observations = {}
+        local_index = {}
         for agent_id, agent in enumerate(self.possible_agents):
-            observations[agent] = self._get_obs_agent(agent_id, mujoco_data)
-        return observations
-
-    def map_local_observation_to_global_state(
-        self, local_observations: dict[str, np.ndarray]
-    ) -> np.ndarray:
-        """Maps multi agent observations into single agent observation space.
-
-        NOT IMPLEMENTED, try using MaMuJoCo.state() instead
-
-        Args:
-            local_obserations:
-                the local observation of each agents (generated from MaMuJoCo.step())
-
-        Returns:
-            the global observations that correspond to a single agent (what you would get with MaMuJoCo.state())
-        """
-        # Dev notes for anyone who attempts to implement it:
-        # - Depending on the factorization the local observations may not observe the total global observable space, you will need to handle that
-        raise NotImplementedError
+            local_index[agent] = self._get_obs_agent(agent_id, mujoco_data)
+        return local_index
 
     def observation_space(self, agent: str) -> gymnasium.spaces.Box:
         """See [pettingzoo.utils.env.ParallelEnv.observation_space](https://pettingzoo.farama.org/api/parallel/#pettingzoo.utils.env.ParallelEnv.observation_space)."""
@@ -446,28 +538,32 @@ def _get_obs_agent(self, agent_id: int, data=None) -> np.ndarray:
         """
         if self.agent_obsk is None:
             return self.single_agent_env.unwrapped._get_obs()
+
+        index_only = True
         if data is None:
-            data = self.single_agent_env.data
+            data = self.single_agent_env.unwrapped.data
+            index_only = False
 
         return build_obs(
             data,
             self.k_dicts[agent_id],
-            self.k_categories,
+            self.local_categories,
             self.mujoco_globals,
             self.global_categories,
+            index_only,
         )
 
-    def reset(self, seed: int | None = None, options=None):
+    def reset(self, seed: int | None = None, options: dict[str, any] | None = None):
         """Resets the the `single_agent_env`.
 
         Args:
-            seed: see [pettingzoo.utils.env.ParallelEnv.reset()](https://pettingzoo.farama.org/api/parallel/#pettingzoo.utils.env.ParallelEnv.reset) doc
-            options: Ignored arguments
+            seed: see [pettingzoo.utils.env.ParallelEnv.reset()](https://pettingzoo.farama.org/api/parallel/#pettingzoo.utils.env.ParallelEnv.reset) doc.
+            options: passed to the single agent env's `reset`.
 
         Returns:
             Initial observations and info
         """
-        _, info_n = self.single_agent_env.reset(seed=seed)
+        _, info_n = self.single_agent_env.reset(seed=seed, options=options)
         info = {}
         for agent in self.possible_agents:
             info[agent] = info_n
@@ -487,10 +583,6 @@ def close(self):
         """See [pettingzoo.utils.env.ParallelEnv.close](https://pettingzoo.farama.org/api/parallel/#pettingzoo.utils.env.ParallelEnv.close)."""
         self.single_agent_env.close()
 
-    def seed(self, seed: int | None = None):
-        """Not implemented use env.reset(seed=...) instead."""
-        raise NotImplementedError("use env.reset(seed=...) instead")
-
     def _generate_local_categories(self, scenario: str) -> list[list[str]]:
         """Generated the default observation categories for each observation depth.
 
@@ -503,48 +595,30 @@ def _generate_local_categories(self, scenario: str) -> list[list[str]]:
         if self.agent_obsk is None:
             return [[]]
 
-        if scenario in ["Ant-v4", "ManySegmentAnt"]:
-            # k_split = ["qpos,qvel,cfrc_ext", "qpos"]  # Gymansium.MuJoCo.Ant-v4 has disabled cfrc_ext by default
-            k_split = ["qpos,qvel", "qpos"]
-        elif scenario in ["Humanoid-v4", "HumanoidStandup-v4"]:
-            k_split = [
-                "qpos,qvel,cinert,cvel,qfrc_actuator,cfrc_ext",
-                "qpos",
+        if scenario in ["Ant", "ManySegmentAnt"]:
+            k_categories = [["qpos", "qvel", "cfrc_ext"], ["qpos"]]
+        elif scenario in ["Humanoid", "HumanoidStandup"]:
+            k_categories = [
+                ["qpos", "qvel", "cinert", "cvel", "qfrc_actuator", "cfrc_ext"],
+                ["qpos"],
             ]
-        elif scenario in ["CoupledHalfCheetah-v4"]:
-            k_split = ["qpos,qvel,ten_J,ten_length,ten_velocity", "qpos"]
-        elif scenario in ["Reacher-v4"]:
-            k_split = ["qpos,qvel,fingertip_dist", "qpos"]
+        elif scenario in ["CoupledHalfCheetah"]:
+            k_categories = [
+                ["qpos", "qvel", "ten_J", "ten_length", "ten_velocity"],
+                ["qpos"],
+            ]
+        elif scenario in ["Reacher"]:
+            k_categories = [["qpos", "qvel", "fingertip_dist"], ["qpos"]]
         else:
-            k_split = ["qpos,qvel", "qpos"]
+            k_categories = [["qpos", "qvel"], ["qpos"]]
 
+        # extend the length of categories to match `self.agent_obsk` by repeating the last element
         categories = [
-            k_split[k if k < len(k_split) else -1].split(",")
+            k_categories[k if k < len(k_categories) else -1]
             for k in range(self.agent_obsk + 1)
         ]
         return categories
 
-    def _generate_global_categories(self, scenario: str) -> tuple[str, ...]:
-        """Generates the default global categories of observations.
-
-        Args:
-            scenario: The name of the MuJoCo Task
-
-        Returns:
-            The default Global Categories for the scenario (a list of all observable types for that domain)
-        """
-        if self.agent_obsk is None:
-            return ()
-
-        if scenario in ["Ant-v4", "ManySegmentAnt"]:
-            return ("qpos", "qvel")
-        elif scenario in ["Humanoid-v4", "HumanoidStandup-v4"]:
-            return ("qpos", "qvel", "cinert", "cvel", "qfrc_actuator", "cfrc_ext")
-        elif scenario in ["CoupledHalfCheetah-v4"]:
-            return ("qpos", "qvel")
-        else:
-            return ("qpos", "qvel")
-
 
 # These are the export functions (for `PettingZoo` style exportations)
 env = pettingzoo.utils.conversions.aec_wrapper_fn(MultiAgentMujocoEnv)
diff --git a/gymnasium_robotics/envs/multiagent_mujoco/obsk.py b/gymnasium_robotics/envs/multiagent_mujoco/obsk.py
index 35389e4c..172058d0 100644
--- a/gymnasium_robotics/envs/multiagent_mujoco/obsk.py
+++ b/gymnasium_robotics/envs/multiagent_mujoco/obsk.py
@@ -17,7 +17,6 @@
  - `Walker2D`: Added missing Global Observations
  - `CoupledHalfCheetah`: improved node naming, fixed tendon Jacobian observations, fixed action mapping of the second cheetah, added missing global observationsm, fixed action ordering
  - `ManySegmentAnt`: Fixed Global Observations
- - added new functions: `_observation_structure`
 
 This project is covered by the Apache 2.0 License.
 """
@@ -157,18 +156,20 @@ def _adjacent(lst):  # return all sets adjacent to any element in lst
 def build_obs(
     data,
     k_dict: dict[int, list[Node]],
-    k_categories: list[list[str]],
+    local_categories: list[list[str]],
     global_nodes: list[Node],
     global_categories: tuple[str, ...],
+    ignore_body_fn: bool = False,
 ) -> np.ndarray:
     """Given a k_dict from get_joints_at_kdist, extract observation vector.
 
     Args:
-        data: a structure containing the global state of the agent
-        k_dict: the k_dict of an agent
-        k_categories: the categories at every depth level
-        global_nodes: The MuJoCo global godes
-        global_categories: The observation Categories for the global MuJoCo nodes
+        data: a structure containing the global state of the agent.
+        k_dict: the k_dict of an agent.
+        local_categories: the categories at every depth level.
+        global_nodes: The MuJoCo global nodes.
+        global_categories: The observation Categories for the global MuJoCo nodes.
+        ignore_body_fn: If `True` it ignores the node's `body_fn` member variable.
 
     Returns:
         observation for the agent (indicated by K_dict)
@@ -178,7 +179,7 @@ def build_obs(
     # Add local observations
     for k in sorted(list(k_dict.keys())):
         for node in k_dict[k]:
-            for category in k_categories[k]:
+            for category in local_categories[k]:
                 if category in node.extra_obs:
                     items = node.extra_obs[category](data).tolist()
                     obs_lst.extend(items if isinstance(items, list) else [items])
@@ -195,7 +196,7 @@ def build_obs(
                             body_set_dict[category] = set()
                         if body not in body_set_dict[category]:
                             items = getattr(data, category)[body].tolist()
-                            if node.body_fn is not None:
+                            if node.body_fn is not None and not ignore_body_fn:
                                 items = node.body_fn(body, items)
                             obs_lst.extend(
                                 items if isinstance(items, list) else [items]
@@ -220,7 +221,7 @@ def build_obs(
                         body_set_dict[category] = set()
                     if body not in body_set_dict[category]:
                         items = getattr(data, category)[body].tolist()
-                        if joint.body_fn is not None:
+                        if joint.body_fn is not None and not ignore_body_fn:
                             items = joint.body_fn(body, items)
                         obs_lst.extend(items if isinstance(items, list) else [items])
                         body_set_dict[category].add(body)
@@ -240,8 +241,7 @@ def get_parts_and_edges(  # noqa: C901
     Returns:
         the partition of the mujoco graph nodes, the graph edges, and global nodes
     """
-    if label in ["HalfCheetah-v4"]:
-
+    if label in ["HalfCheetah"]:
         # define Mujoco graph
         bthigh = Node("bthigh", -6, -6, 0)
         bshin = Node("bshin", -5, -5, 1)
@@ -276,8 +276,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Ant-v4"]:
-
+    elif label in ["Ant"]:
         # define Mujoco graph
         torso = 1
         front_left_leg = 2
@@ -366,18 +365,17 @@ def get_parts_and_edges(  # noqa: C901
             HyperEdge(hip4, hip1, hip2, hip3),
         ]
 
-        torso = Node(
-            "torso",
+        root = Node(
+            "root",
             0,
             0,
             None,
             extra_obs={
                 "qpos": lambda data: data.qpos[2:7],
                 "qvel": lambda data: data.qvel[:6],
-                "cfrc_ext": lambda data: np.clip(data.cfrc_ext[0:1], -1, 1),
             },
         )
-        globals = [torso]
+        globals = [root]
 
         if partitioning is None:
             parts = [(hip4, ankle4, hip1, ankle1, hip2, ankle2, hip3, ankle3)]
@@ -392,8 +390,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Hopper-v4"]:
-
+    elif label in ["Hopper"]:
         # define Mujoco-Graph
         thigh_joint = Node(
             "thigh_joint",
@@ -467,7 +464,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Humanoid-v4", "HumanoidStandup-v4"]:
+    elif label in ["Humanoid", "HumanoidStandup"]:
         # bodies
         # worldbody = 0
         torso = 1
@@ -549,8 +546,6 @@ def get_parts_and_edges(  # noqa: C901
             extra_obs={
                 "qpos": lambda data: data.qpos[2:7],
                 "qvel": lambda data: data.qvel[:6],
-                "qfrc_actuator": lambda data: data.qfrc_actuator[:6],
-                # "cfrc_ext": lambda data: np.clip(data.cfrc_ext[0:1], -1, 1),
             },
         )
         globals = [root]
@@ -608,7 +603,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Reacher-v4"]:
+    elif label in ["Reacher"]:
         # define Mujoco-Graph
         # worldbody = 0
         body0 = 1
@@ -679,7 +674,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Pusher-v4"]:
+    elif label in ["Pusher"]:
         # define Mujoco-Graph
         r_shoulder_pan_joint = Node("r_wrist_roll_joint", 0, 0, 0)
         r_shoulder_lift_joint = Node("r_wrist_roll_joint", 1, 1, 1)
@@ -759,7 +754,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Swimmer-v4"]:
+    elif label in ["Swimmer"]:
         # define Mujoco-Graph
         joint0 = Node(
             "rot2",
@@ -794,7 +789,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["Walker2d-v4"]:
+    elif label in ["Walker2d"]:
         # define Mujoco-Graph
         thigh_joint = Node("thigh_joint", -6, -6, 0)
         leg_joint = Node("leg_joint", -5, -5, 1)
@@ -815,7 +810,7 @@ def get_parts_and_edges(  # noqa: C901
         )
         root_z = Node("root_z", 1, 1, None)
         root_y = Node("root_y", 2, 2, None)
-        globals = [root_x, root_x, root_z]
+        globals = [root_x, root_z, root_y]
 
         if partitioning is None:
             parts = [
@@ -844,7 +839,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["CoupledHalfCheetah-v4"]:
+    elif label in ["CoupledHalfCheetah"]:
         # define Mujoco graph
         tendon = 0
 
@@ -940,7 +935,7 @@ def get_parts_and_edges(  # noqa: C901
 
         return parts, edges, globals
 
-    elif label in ["ManySegmentSwimmer-v4"]:
+    elif label in ["ManySegmentSwimmer"]:
         assert partitioning is not None, "Partitioning, required with " + label
 
         try:
@@ -965,7 +960,7 @@ def get_parts_and_edges(  # noqa: C901
         ]
         return parts, edges, globals
 
-    elif label in ["ManySegmentAnt-v4"]:
+    elif label in ["ManySegmentAnt"]:
         assert partitioning is not None, "Partitioning, required with " + label
 
         try:
@@ -1062,74 +1057,3 @@ def get_parts_and_edges(  # noqa: C901
         return parts, edges, globals
     else:
         raise Exception(f"UNKNOWN label environment: {label}")
-
-
-def _observation_structure(scenario: str) -> dict[str, int]:
-    """Get the types of observations for each Gymnasium.MuJoCo environment.
-
-    Args:
-        scenario: the mujoco scenartio
-
-    Returns:
-        a dictionary keyied by observation type with values indicating the number of observations for that type
-    """
-    ret = {
-        "skipped_qpos": 0,  # Position data what is excluded/skip
-        "qpos": 0,  # Position
-        "qvel": 0,  # Velocity
-        "cinert": 0,  # com inertia
-        "cvel": 0,  # com velocity
-        "qfrc_actuator": 0,  # Actuator Forces
-        "cfrc_ext": 0,  # Contact Forces
-    }
-
-    if scenario == "Ant-v4":
-        ret["skipped_qpos"] = 2
-        ret["qpos"] = 13
-        ret["qvel"] = 14
-        # ret["cfrc_ext"] = 84
-    elif scenario == "HalfCheetah-v4":
-        ret["skipped_qpos"] = 1
-        ret["qpos"] = 8
-        ret["qvel"] = 9
-    elif scenario == "Hopper-v4":
-        ret["skipped_qpos"] = 1
-        ret["qpos"] = 5
-        ret["qvel"] = 6
-    elif scenario == "HumanoidStandup-v4" or scenario == "Humanoid-v4":
-        ret["skipped_qpos"] = 2
-        ret["qpos"] = 22
-        ret["qvel"] = 23
-        ret["cinert"] = 140
-        ret["cvel"] = 84
-        ret["qfrc_actuator"] = 23
-        ret["cfrc_ext"] = 84
-    elif scenario == "InvertedDoublePendulum-v4":
-        assert False, scenario + "can not be factorized"
-        ret["qpos"] = 3
-        ret["qvel"] = 3
-        # qfrc_constraint = 3
-    elif scenario == "InvertedPendulum-v4":
-        assert False, scenario + "can not be factorized"
-        ret["qpos"] = 2
-        ret["qvel"] = 2
-    elif scenario == "Pusher-v4":
-        assert False, scenario + "is not supported"
-        ret["qpos"] = 7
-        ret["qvel"] = 7
-        # 9 body_com
-    elif scenario == "Reacher-v4":
-        assert False, scenario + "can not be factorized"
-        ret["qpos"] = 6
-        ret["qvel"] = 2
-        # 3 body_com
-    elif scenario == "Swimmer-v4":
-        ret["skipped_qpos"] = 2
-        ret["qpos"] = 3
-        ret["qvel"] = 5
-    elif scenario == "Walker2d-v4":
-        ret["skipped_qpos"] = 1
-        ret["qpos"] = 8
-        ret["qvel"] = 9
-
-    return ret
diff --git a/tests/envs/MaMuJoCo/test_MaMuJoCo.py b/tests/envs/MaMuJoCo/test_MaMuJoCo.py
index 1570b682..feeb05c4 100644
--- a/tests/envs/MaMuJoCo/test_MaMuJoCo.py
+++ b/tests/envs/MaMuJoCo/test_MaMuJoCo.py
@@ -1,61 +1,111 @@
 from __future__ import annotations
 
 import collections
+import os
 
+import gymnasium
 import pytest
 from gymnasium.utils.env_checker import data_equivalence
+from gymnasium.utils.env_match import check_environments_match
 from pettingzoo.test import parallel_api_test
 
-from gymnasium_robotics import mamujoco_v0
+import gymnasium_robotics.envs.multiagent_mujoco.many_segment_swimmer as many_segment_swimmer
+from gymnasium_robotics import mamujoco_v1
 
-scenario_conf = collections.namedtuple("scenario_conf", "scenario, conf")
+scenario_conf = collections.namedtuple("scenario_conf", "scenario, conf, kwargs")
 
 pre_defined_factorizations = [
-    scenario_conf("InvertedPendulum", None),  # For Debugging
-    scenario_conf("Ant", None),
-    scenario_conf("Ant", "2x4"),
-    scenario_conf("Ant", "2x4d"),
-    scenario_conf("Ant", "4x2"),
-    scenario_conf("HalfCheetah", "2x3"),
-    scenario_conf("HalfCheetah", "6x1"),
-    scenario_conf("HalfCheetah", None),
-    scenario_conf("Hopper", "3x1"),
-    scenario_conf("Hopper", None),
-    scenario_conf("Humanoid", "9|8"),
-    scenario_conf("Humanoid", None),
-    scenario_conf("HumanoidStandup", "9|8"),
-    scenario_conf("HumanoidStandup", None),
-    scenario_conf("Reacher", "2x1"),
-    scenario_conf("Reacher", None),
-    scenario_conf("Swimmer", "2x1"),
-    scenario_conf("Swimmer", None),
-    scenario_conf("Pusher", "3p"),
-    scenario_conf("Pusher", None),
-    scenario_conf("Walker2d", "2x3"),
-    scenario_conf("Walker2d", None),
-]
-
-sample_configurations = [
-    scenario_conf("ManySegmentSwimmer", "10x2"),
-    # scenario_conf("ManySegmentSwimmer", "5x4"),
-    scenario_conf("ManySegmentSwimmer", "6x1"),
-    scenario_conf("ManySegmentAnt", "2x3"),
-    scenario_conf("ManySegmentAnt", "3x1"),
-    scenario_conf("CoupledHalfCheetah", "1p1"),
-    scenario_conf("CoupledHalfCheetah", None),
+    scenario_conf("InvertedPendulum", None, {}),  # For Debugging
+    scenario_conf("Ant", None, {}),
+    scenario_conf("Ant", "2x4", {}),
+    scenario_conf("Ant", "2x4d", {}),
+    scenario_conf("Ant", "4x2", {}),
+    scenario_conf("Ant", "2x4", {}),
+    scenario_conf("Ant", "2x4d", {}),
+    scenario_conf(
+        "Ant",
+        "2x4",
+        {
+            "local_categories": [["qpos", "qvel"], ["qpos"], ["qpos"]],
+            "include_cfrc_ext_in_observation": False,
+        },
+    ),
+    scenario_conf(
+        "Ant",
+        "2x4d",
+        {
+            "local_categories": [["qpos", "qvel"], ["qpos"], ["qpos"]],
+            "include_cfrc_ext_in_observation": False,
+        },
+    ),
+    scenario_conf(
+        "Ant",
+        "4x2",
+        {
+            "local_categories": [["qpos", "qvel"], ["qpos"], ["qpos"]],
+            "include_cfrc_ext_in_observation": False,
+        },
+    ),
+    scenario_conf("HalfCheetah", "2x3", {}),
+    scenario_conf("HalfCheetah", "6x1", {}),
+    scenario_conf("HalfCheetah", None, {}),
+    scenario_conf("Hopper", "3x1", {}),
+    scenario_conf("Hopper", None, {}),
+    scenario_conf("Humanoid", "9|8", {}),
+    scenario_conf(
+        "Humanoid",
+        "9|8",
+        {
+            "local_categories": [["qpos", "qvel"], ["qpos"], ["qpos"]],
+            "include_cinert_in_observation": False,
+            "include_cvel_in_observation": False,
+            "include_qfrc_actuator_in_observation": False,
+            "include_cfrc_ext_in_observation": False,
+        },
+    ),
+    scenario_conf("Humanoid", None, {}),
+    scenario_conf("HumanoidStandup", "9|8", {}),
+    scenario_conf(
+        "HumanoidStandup",
+        "9|8",
+        {
+            "local_categories": [["qpos", "qvel"], ["qpos"], ["qpos"]],
+            "include_cinert_in_observation": False,
+            "include_cvel_in_observation": False,
+            "include_qfrc_actuator_in_observation": False,
+            "include_cfrc_ext_in_observation": False,
+        },
+    ),
+    scenario_conf("HumanoidStandup", None, {}),
+    scenario_conf("Reacher", "2x1", {}),
+    scenario_conf("Reacher", None, {}),
+    scenario_conf("Swimmer", "2x1", {}),
+    scenario_conf("Swimmer", None, {}),
+    scenario_conf("Pusher", "3p", {}),
+    scenario_conf("Pusher", None, {}),
+    scenario_conf("Walker2d", "2x3", {}),
+    scenario_conf("Walker2d", None, {}),
+    scenario_conf("ManySegmentSwimmer", "10x2", {}),
+    scenario_conf("ManySegmentSwimmer", "5x4", {}),
+    scenario_conf("ManySegmentSwimmer", "6x1", {}),
+    scenario_conf("ManySegmentSwimmer", "1x2", {}),
+    scenario_conf("ManySegmentAnt", "2x3", {}),
+    scenario_conf("ManySegmentAnt", "3x1", {}),
+    scenario_conf("CoupledHalfCheetah", "1p1", {}),
+    scenario_conf("CoupledHalfCheetah", None, {}),
 ]
 
 observation_depths = [None, 0, 1, 2]
 
 
 @pytest.mark.parametrize("observation_depth", observation_depths)
-@pytest.mark.parametrize("task", pre_defined_factorizations + sample_configurations)
+@pytest.mark.parametrize("task", pre_defined_factorizations)
 def test_general(observation_depth, task) -> None:
     """Asserts that the environments are compliant with `pettingzoo.utils.env.ParallelEnv` API."""
     parallel_api_test(
         # MultiAgentMujocoEnv(task.scenario, task.conf, agent_obsk=observation_depth),
-        mamujoco_v0.parallel_env(
-            task.scenario, task.conf, agent_obsk=observation_depth
+        mamujoco_v1.parallel_env(
+            task.scenario, task.conf, agent_obsk=observation_depth, **task.kwargs
         ),
         num_cycles=1_000_000,
     )
@@ -65,9 +115,10 @@ def test_general(observation_depth, task) -> None:
 @pytest.mark.parametrize("task", pre_defined_factorizations)
 def test_action_and_observation_mapping(observation_depth, task):
     """Assert that converting local <-> global <-> local obervations/actions results in the same observation/actions."""
-    test_env = mamujoco_v0.parallel_env(
-        task.scenario, task.conf, agent_obsk=observation_depth
+    test_env = mamujoco_v1.parallel_env(
+        task.scenario, task.conf, agent_obsk=observation_depth, **task.kwargs
     )
+
     # assert action mapping
     global_action = test_env.single_agent_env.action_space.sample()
     assert (
@@ -77,8 +128,11 @@ def test_action_and_observation_mapping(observation_depth, task):
         )
     ).all()
 
-    if task.scenario in ["Reacher", "Pusher"] and task.conf is not None:
-        return  # observation mapping not implemented on "Reacher" and "Pusher" Environment
+    if (
+        task.scenario in ["Reacher", "Pusher", "CoupledHalfCheetah"]
+        and task.conf is not None
+    ):
+        return  # observation mapping not implemented on those environments
 
     # assert observation mapping
     test_env.reset()
@@ -90,22 +144,22 @@ def test_action_and_observation_mapping(observation_depth, task):
         local_observations,
     )
 
+    if (
+        task.scenario in ["ManySegmentSwimmer", "ManySegmentAnt"]
+        and task.conf is not None
+    ):
+        return  # mapping local to global observations is not supported on these environments since the local observations do not observe the full environment
 
-@pytest.mark.parametrize("observation_depth", observation_depths)
-@pytest.mark.parametrize("task", sample_configurations)
-def test_action_mapping(observation_depth, task):
-    # observation mapping not implemented non-Gymansium mujoco environments
-    """Assert that converting local <-> global <-> local actions results in the same actions."""
-    test_env = mamujoco_v0.parallel_env(
-        task.scenario, task.conf, agent_obsk=observation_depth
+    data_equivalence(
+        test_env.map_local_observations_to_global_state(local_observations),
+        global_observations,
     )
-    global_action = test_env.single_agent_env.action_space.sample()
-    assert (
-        global_action
-        == test_env.map_local_actions_to_global_action(
-            test_env.map_global_action_to_local_actions(global_action)
-        )
-    ).all()
+
+    # sanity check: an agent's observation factorization must not list the same entry twice
+    for agent_obs_factor in test_env.observation_factorization.values():
+        assert len(agent_obs_factor) == len(
+            set(agent_obs_factor)
+        ), "an agent observes the same state value multiple times"
 
 
 # The black formatter was disabled because it results in `k_dicts_tasks` being an unreadable mess
@@ -141,7 +195,19 @@ def test_k_dict(task):
     If this test fails it means either the factorization in `obsk.get_parts_and_edges()` is wrong or that `obsk.get_joints_at_kdist()` generates wrong k_dict
     """
     for k, k_dict in enumerate(task.list_k_dicts):
-        test_env = mamujoco_v0.parallel_env(
+        test_env = mamujoco_v1.parallel_env(
             scenario=task.scenario, agent_conf=task.conf, agent_obsk=k
         )
         assert str(test_env.k_dicts) == k_dict, str(test_env.k_dicts)
+
+
+def test_swimmer_gen(tmp_path):
+    """Assert that the many segment swimmer environment is identical to the simple environments."""
+    env = gymnasium.make("Swimmer-v5")
+
+    asset_path = str(tmp_path / "swimmer_2seg.xml")  # pytest temp dir, not a fixed /tmp path
+    many_segment_swimmer.gen_asset(n_segs=2, asset_path=asset_path)
+    c_env = gymnasium.make("Swimmer-v5", xml_file=asset_path)
+    os.remove(asset_path)
+
+    check_environments_match(env, c_env, num_steps=2000)

From db0baf5742e836df55d24fe5481673bdd1c92d1b Mon Sep 17 00:00:00 2001
From: Kallinteris Andreas
 <30759571+Kallinteris-Andreas@users.noreply.github.com>
Date: Sat, 9 Mar 2024 16:41:37 +0000
Subject: [PATCH 4/4] Update ma_multiagentswimmer.md (#212)

---
 docs/envs/MaMuJoCo/ma_multiagentswimmer.md | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/docs/envs/MaMuJoCo/ma_multiagentswimmer.md b/docs/envs/MaMuJoCo/ma_multiagentswimmer.md
index ce3657ca..90371ca2 100644
--- a/docs/envs/MaMuJoCo/ma_multiagentswimmer.md
+++ b/docs/envs/MaMuJoCo/ma_multiagentswimmer.md
@@ -2,9 +2,9 @@
 firstpage:
 lastpage:
 ---
-ManySegmentSwimmer
 
-# Swimmer
+
+# ManySegmentSwimmer
 ```{figure} figures/many_segment_swimmer.png
     :name: many_segment_swimmer
 ```