diff --git a/mujoco_playground/_src/locomotion/__init__.py b/mujoco_playground/_src/locomotion/__init__.py index ce5d98287..a80c3d1c7 100644 --- a/mujoco_playground/_src/locomotion/__init__.py +++ b/mujoco_playground/_src/locomotion/__init__.py @@ -22,6 +22,7 @@ from mujoco import mjx from mujoco_playground._src import mjx_env +from mujoco_playground._src.locomotion.apollo import joystick as apollo_joystick from mujoco_playground._src.locomotion.barkour import joystick as barkour_joystick from mujoco_playground._src.locomotion.berkeley_humanoid import joystick as berkeley_humanoid_joystick from mujoco_playground._src.locomotion.berkeley_humanoid import randomize as berkeley_humanoid_randomize @@ -41,6 +42,9 @@ from mujoco_playground._src.locomotion.t1 import randomize as t1_randomize _envs = { + "ApolloJoystickFlatTerrain": functools.partial( + apollo_joystick.Joystick, task="flat_terrain" + ), "BarkourJoystick": barkour_joystick.Joystick, "BerkeleyHumanoidJoystickFlatTerrain": functools.partial( berkeley_humanoid_joystick.Joystick, task="flat_terrain" @@ -82,6 +86,7 @@ } _cfgs = { + "ApolloJoystickFlatTerrain": apollo_joystick.default_config, "BarkourJoystick": barkour_joystick.default_config, "BerkeleyHumanoidJoystickFlatTerrain": ( berkeley_humanoid_joystick.default_config diff --git a/mujoco_playground/_src/locomotion/apollo/__init__.py b/mujoco_playground/_src/locomotion/apollo/__init__.py new file mode 100644 index 000000000..8d9506aab --- /dev/null +++ b/mujoco_playground/_src/locomotion/apollo/__init__.py @@ -0,0 +1,14 @@ +# Copyright 2025 DeepMind Technologies Limited +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== diff --git a/mujoco_playground/_src/locomotion/apollo/base.py b/mujoco_playground/_src/locomotion/apollo/base.py new file mode 100644 index 000000000..28fec9b4e --- /dev/null +++ b/mujoco_playground/_src/locomotion/apollo/base.py @@ -0,0 +1,162 @@ +# Copyright 2025 DeepMind Technologies Limited +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+# ============================================================================== +"""Base classes for Apollo.""" + +from typing import Any, Dict, Optional, Union + +import jax +import jax.numpy as jp +import mujoco +import numpy as np +from etils import epath +from ml_collections import config_dict +from mujoco import mjx + +from mujoco_playground._src import mjx_env +from mujoco_playground._src.locomotion.apollo import constants as consts +from mujoco_playground._src.collision import geoms_colliding + + +def get_assets() -> Dict[str, bytes]: + assets = {} + # Playground assets. + mjx_env.update_assets(assets, consts.XML_DIR, "*.xml") + mjx_env.update_assets(assets, consts.XML_DIR / "assets") + # Menagerie assets. + path = mjx_env.MENAGERIE_PATH / "apptronik_apollo" + mjx_env.update_assets(assets, path, "*.xml") + mjx_env.update_assets(assets, path / "assets") + mjx_env.update_assets(assets, path / "assets" / "ability_hand") + return assets + + +class ApolloEnv(mjx_env.MjxEnv): + """Base class for Apollo environments.""" + + def __init__( + self, + xml_path: str, + config: config_dict.ConfigDict, + config_overrides: Optional[Dict[str, Union[str, int, list[Any]]]] = None, + ) -> None: + super().__init__(config, config_overrides) + + self._mj_model = mujoco.MjModel.from_xml_string( + epath.Path(xml_path).read_text(), assets=get_assets() + ) + self._mj_model.opt.timestep = self.sim_dt + + self._mj_model.vis.global_.offwidth = 3840 + self._mj_model.vis.global_.offheight = 2160 + + self._mjx_model = mjx.put_model(self._mj_model) + self._xml_path = xml_path + + self._init_q = jp.array(self._mj_model.keyframe("knees_bent").qpos) + self._default_ctrl = jp.array(self._mj_model.keyframe("knees_bent").ctrl) + self._default_pose = jp.array(self._mj_model.keyframe("knees_bent").qpos[7:]) + self._actuator_torques = self.mj_model.jnt_actfrcrange[1:, 1] + + # Body IDs. + self._torso_body_id = self._mj_model.body(consts.ROOT_BODY).id + + # Geom IDs. + self._floor_geom_id = self._mj_model.geom("floor").id + self._left_feet_geom_id = np.array( + [self._mj_model.geom(name).id for name in consts.LEFT_FEET_GEOMS] + ) + self._right_feet_geom_id = np.array( + [self._mj_model.geom(name).id for name in consts.RIGHT_FEET_GEOMS] + ) + self._left_hand_geom_id = self._mj_model.geom("collision_l_hand_plate").id + self._right_hand_geom_id = self._mj_model.geom("collision_r_hand_plate").id + self._left_foot_geom_id = self._mj_model.geom("collision_l_sole").id + self._right_foot_geom_id = self._mj_model.geom("collision_r_sole").id + self._left_shin_geom_id = self._mj_model.geom("collision_capsule_body_l_shin").id + self._right_shin_geom_id = self._mj_model.geom("collision_capsule_body_r_shin").id + self._left_thigh_geom_id = self._mj_model.geom("collision_capsule_body_l_thigh").id + self._right_thigh_geom_id = self._mj_model.geom("collision_capsule_body_r_thigh").id + + # Site IDs. + self._imu_site_id = self._mj_model.site("imu").id + self._feet_site_id = np.array( + [self._mj_model.site(name).id for name in consts.FEET_SITES] + ) + + # Sensor readings. 
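+  # Each getter below reads a named MuJoCo sensor (names defined in
+  # constants.py) via mjx_env.get_sensor_data.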
+
+  def get_gravity(self, data: mjx.Data) -> jax.Array:
+    """Return the gravity vector in the world frame."""
+    return mjx_env.get_sensor_data(self.mj_model, data, consts.GRAVITY_SENSOR)
+
+  def get_global_linvel(self, data: mjx.Data) -> jax.Array:
+    """Return the linear velocity of the robot in the world frame."""
+    return mjx_env.get_sensor_data(
+        self.mj_model, data, consts.GLOBAL_LINVEL_SENSOR
+    )
+
+  def get_global_angvel(self, data: mjx.Data) -> jax.Array:
+    """Return the angular velocity of the robot in the world frame."""
+    return mjx_env.get_sensor_data(
+        self.mj_model, data, consts.GLOBAL_ANGVEL_SENSOR
+    )
+
+  def get_local_linvel(self, data: mjx.Data) -> jax.Array:
+    """Return the linear velocity of the robot in the local frame."""
+    return mjx_env.get_sensor_data(self.mj_model, data, consts.LOCAL_LINVEL_SENSOR)
+
+  def get_accelerometer(self, data: mjx.Data) -> jax.Array:
+    """Return the accelerometer readings in the local frame."""
+    return mjx_env.get_sensor_data(
+        self.mj_model, data, consts.ACCELEROMETER_SENSOR
+    )
+
+  def get_gyro(self, data: mjx.Data) -> jax.Array:
+    """Return the gyroscope readings in the local frame."""
+    return mjx_env.get_sensor_data(self.mj_model, data, consts.GYRO_SENSOR)
+
+  def get_feet_ground_contacts(self, data: mjx.Data) -> jax.Array:
+    """Return an array indicating whether each foot is in contact with the ground."""
+    left_feet_contact = jp.array([
+        geoms_colliding(data, geom_id, self._floor_geom_id)
+        for geom_id in self._left_feet_geom_id
+    ])
+    right_feet_contact = jp.array([
+        geoms_colliding(data, geom_id, self._floor_geom_id)
+        for geom_id in self._right_feet_geom_id
+    ])
+    return jp.hstack([jp.any(left_feet_contact), jp.any(right_feet_contact)])
+
+  # Accessors.
+
+  @property
+  def xml_path(self) -> str:
+    return self._xml_path
+
+  @property
+  def action_size(self) -> int:
+    return self._mjx_model.nu
+
+  @property
+  def mj_model(self) -> mujoco.MjModel:
+    return self._mj_model
+
+  @property
+  def mjx_model(self) -> mjx.Model:
+    return self._mjx_model
diff --git a/mujoco_playground/_src/locomotion/apollo/constants.py b/mujoco_playground/_src/locomotion/apollo/constants.py
new file mode 100644
index 000000000..3b6b590cd
--- /dev/null
+++ b/mujoco_playground/_src/locomotion/apollo/constants.py
@@ -0,0 +1,53 @@
+# Copyright 2025 DeepMind Technologies Limited
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License. 
+# ============================================================================== +"""Constants for Apollo.""" + +from etils import epath + +from mujoco_playground._src import mjx_env + +XML_DIR = mjx_env.ROOT_PATH / "locomotion" / "apollo" / "xmls" + +FEET_ONLY_FLAT_TERRAIN_XML = XML_DIR / "scene_mjx_feetonly_flat_terrain.xml" + + +def task_to_xml(task_name: str) -> epath.Path: + return { + "flat_terrain": FEET_ONLY_FLAT_TERRAIN_XML, + }[task_name] + + +FEET_SITES = [ + "l_foot", + "r_foot", +] + +HAND_SITES = [ + "left_palm", + "right_palm", +] + +LEFT_FEET_GEOMS = ["collision_l_sole"] +RIGHT_FEET_GEOMS = ["collision_r_sole"] +FEET_GEOMS = LEFT_FEET_GEOMS + RIGHT_FEET_GEOMS + +ROOT_BODY = "torso_link" + +GRAVITY_SENSOR = "upvector" +GLOBAL_LINVEL_SENSOR = "global_linvel" +GLOBAL_ANGVEL_SENSOR = "global_angvel" +LOCAL_LINVEL_SENSOR = "local_linvel" +ACCELEROMETER_SENSOR = "accelerometer" +GYRO_SENSOR = "gyro" diff --git a/mujoco_playground/_src/locomotion/apollo/joystick.py b/mujoco_playground/_src/locomotion/apollo/joystick.py new file mode 100644 index 000000000..6472cc453 --- /dev/null +++ b/mujoco_playground/_src/locomotion/apollo/joystick.py @@ -0,0 +1,405 @@ +# Copyright 2025 DeepMind Technologies Limited +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. 
+# ============================================================================== +"""Joystick task for Apollo.""" + +from typing import Any, Dict, Optional, Union + +import jax +import jax.numpy as jp +from ml_collections import config_dict +from mujoco import mjx +from mujoco.mjx._src import math + +from mujoco_playground._src import gait, mjx_env +from mujoco_playground._src.locomotion.apollo import base +from mujoco_playground._src.locomotion.apollo import constants as consts +from mujoco_playground._src.collision import geoms_colliding + + +def default_config() -> config_dict.ConfigDict: + return config_dict.create( + ctrl_dt=0.02, + sim_dt=0.005, + episode_length=1000, + action_repeat=1, + action_scale=0.5, + noise_config=config_dict.create( + level=1.0, + scales=config_dict.create( + joint_pos=0.03, + joint_vel=1.5, + gravity=0.05, + linvel=0.1, + gyro=0.2, + ), + ), + reward_config=config_dict.create( + scales=config_dict.create( + tracking=1.0, + lin_vel_z=0.0, + ang_vel_xy=-0.15, + orientation=-1.0, + torques=0.0, + action_rate=0.0, + energy=0.0, + feet_phase=1.0, + alive=0.0, + termination=0.0, + pose=-1.0, + collision=-1.0, + ), + tracking_sigma=0.25, + max_foot_height=0.12, + ), + push_config=config_dict.create( + enable=True, + interval_range=[5.0, 10.0], + magnitude_range=[0.1, 2.0], + ), + command_config=config_dict.create( + min=[-1.5, -0.8, -1.5], + max=[1.5, 0.8, 1.5], + zero_prob=[0.9, 0.25, 0.5], + ), + ) + + +class Joystick(base.ApolloEnv): + """Track a joystick command.""" + + def __init__( + self, + task: str = "flat_terrain", + config: config_dict.ConfigDict = default_config(), + config_overrides: Optional[Dict[str, Union[str, int, list[Any]]]] = None, + ): + super().__init__( + xml_path=consts.task_to_xml(task).as_posix(), + config=config, + config_overrides=config_overrides, + ) + + self._cmd_min = jp.array(self._config.command_config.min) + self._cmd_max = jp.array(self._config.command_config.max) + self._cmd_zero_prob = jp.array(self._config.command_config.zero_prob) + + # fmt: off + self._weights = jp.array([ + 5.0, 5.0, 5.0, # Torso. + 1.0, 1.0, 1.0, # Neck. + 1.0, 1.0, 0.1, 1.0, 1.0, 1.0, 1.0, # Left arm. + 1.0, 1.0, 0.1, 1.0, 1.0, 1.0, 1.0, # Right arm. + 1.0, 1.0, 0.01, 0.01, 1.0, 1.0, # Left leg. + 1.0, 1.0, 0.01, 0.01, 1.0, 1.0, # Right leg. + ]) + # fmt: on + + def reset(self, rng: jax.Array) -> mjx_env.State: + qpos = self._init_q + qvel = jp.zeros(self.mjx_model.nv) + + # Randomize xy position and yaw, xy=+U(-0.5, 0.5), yaw=U(-pi, pi). + rng, key = jax.random.split(rng) + dxy = jax.random.uniform(key, (2,), minval=-0.5, maxval=0.5) + qpos = qpos.at[0:2].set(qpos[0:2] + dxy) + rng, key = jax.random.split(rng) + yaw = jax.random.uniform(key, (1,), minval=-3.14, maxval=3.14) + quat = math.axis_angle_to_quat(jp.array([0, 0, 1]), yaw) + new_quat = math.quat_mul(qpos[3:7], quat) + qpos = qpos.at[3:7].set(new_quat) + + # Perturb initial joint angles, qpos[7:]=*U(0.5, 1.5) + rng, key = jax.random.split(rng) + qpos = qpos.at[7:].set( + qpos[7:] + * jax.random.uniform(key, (self.mjx_model.nq - 7,), minval=0.5, maxval=1.5) + ) + + # Perturb initial joint velocities, d(xyzrpy)=U(-0.5, 0.5) + rng, key = jax.random.split(rng) + qvel = qvel.at[0:6].set(jax.random.uniform(key, (6,), minval=-0.5, maxval=0.5)) + + data = mjx_env.init(self.mjx_model, qpos=qpos, qvel=qvel) + + # Sample gait frequency =U(1.25, 1.75). 
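+    # The two phase entries are per-foot gait clocks offset by pi so the feet
+    # alternate; phase_dt is the clock increment applied each control step.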
+ rng, key = jax.random.split(rng) + gait_freq = jax.random.uniform(key, (1,), minval=1.25, maxval=1.75) + phase_dt = 2 * jp.pi * self.dt * gait_freq + phase = jp.array([0, jp.pi]) + + # Sample push interval. + rng, push_rng = jax.random.split(rng) + push_interval = jax.random.uniform( + push_rng, + minval=self._config.push_config.interval_range[0], + maxval=self._config.push_config.interval_range[1], + ) + push_interval_steps = jp.round(push_interval / self.dt).astype(jp.int32) + + # Sample command. + rng, key1, key2 = jax.random.split(rng, 3) + time_until_next_cmd = jax.random.exponential(key1) * 5.0 + steps_until_next_cmd = jp.round(time_until_next_cmd / self.dt).astype(jp.int32) + cmd = jax.random.uniform( + key2, shape=(3,), minval=self._cmd_min, maxval=self._cmd_max + ) + + info = { + "rng": rng, + "step": 0, + "command": cmd, + "steps_until_next_cmd": steps_until_next_cmd, + "last_act": jp.zeros(self.mjx_model.nu), + "phase_dt": phase_dt, + "phase": phase, + "push": jp.array([0.0, 0.0]), + "push_step": 0, + "push_interval_steps": push_interval_steps, + "filtered_linvel": jp.zeros(3), + "filtered_angvel": jp.zeros(3), + } + metrics = { + "termination/fall_termination": jp.zeros(()), + } + for k in self._config.reward_config.scales.keys(): + metrics[f"reward/{k}"] = jp.zeros(()) + + obs = self._get_obs(data, info) + reward, done = jp.zeros(2) + return mjx_env.State(data, obs, reward, done, metrics, info) + + def step(self, state: mjx_env.State, action: jax.Array) -> mjx_env.State: + state = self.apply_push(state) + motor_targets = self._default_ctrl + action * self._config.action_scale + data = mjx_env.step(self.mjx_model, state.data, motor_targets, self.n_substeps) + + linvel = self.get_local_linvel(data) + state.info["filtered_linvel"] = linvel * 1.0 + state.info["filtered_linvel"] * 0.0 + angvel = self.get_gyro(data) + state.info["filtered_angvel"] = angvel * 1.0 + state.info["filtered_angvel"] * 0.0 + + obs = self._get_obs(data, state.info) + done = self._get_termination(data, state.metrics) + rewards = self._get_reward(data, action, state.info, state.metrics, done) + rewards = {k: v * self._config.reward_config.scales[k] for k, v in rewards.items()} + reward = sum(rewards.values()) * self.dt + + state.info["step"] += 1 + phase_tp1 = state.info["phase"] + state.info["phase_dt"] + state.info["phase"] = jp.fmod(phase_tp1 + jp.pi, 2 * jp.pi) - jp.pi + state.info["phase"] = jp.where( + jp.linalg.norm(state.info["command"]) > 0.01, + state.info["phase"], + jp.ones(2) * jp.pi, + ) + state.info["last_act"] = action + state.info["steps_until_next_cmd"] -= 1 + state.info["rng"], key1, key2 = jax.random.split(state.info["rng"], 3) + state.info["command"] = jp.where( + state.info["steps_until_next_cmd"] <= 0, + self.sample_command(key1, state.info["command"]), + state.info["command"], + ) + state.info["steps_until_next_cmd"] = jp.where( + done | (state.info["steps_until_next_cmd"] <= 0), + jp.round(jax.random.exponential(key2) * 5.0 / self.dt).astype(jp.int32), + state.info["steps_until_next_cmd"], + ) + for k, v in rewards.items(): + state.metrics[f"reward/{k}"] = v + done = done.astype(reward.dtype) + state = state.replace(data=data, obs=obs, reward=reward, done=done) + return state + + def _get_termination(self, data: mjx.Data, metrics: dict[str, Any]) -> jax.Array: + fall_termination = self.get_gravity(data)[-1] < 0.0 + metrics["termination/fall_termination"] = fall_termination.astype(jp.float32) + return fall_termination | jp.isnan(data.qpos).any() | jp.isnan(data.qvel).any() + + def 
_apply_noise( + self, info: dict[str, Any], value: jax.Array, scale: float + ) -> jax.Array: + info["rng"], noise_rng = jax.random.split(info["rng"]) + noise = 2 * jax.random.uniform(noise_rng, shape=value.shape) - 1 + noisy_value = value + noise * self._config.noise_config.level * scale + return noisy_value + + def _get_obs(self, data: mjx.Data, info: dict[str, Any]) -> mjx_env.Observation: + # Ground-truth observations. + gyro = self.get_gyro(data) + gravity = data.site_xmat[self._imu_site_id].T @ jp.array([0, 0, -1]) + joint_angles = data.qpos[7:] + joint_vel = data.qvel[6:] + linvel = self.get_local_linvel(data) + phase = jp.concatenate([jp.cos(info["phase"]), jp.sin(info["phase"])]) + root_pos = data.qpos[:3] + root_quat = data.qpos[3:7] + actuator_torques = data.actuator_force + # Noisy observations. + noise_scales = self._config.noise_config.scales + noisy_gyro = self._apply_noise(info, gyro, noise_scales.gyro) + noisy_gravity = self._apply_noise(info, gravity, noise_scales.gravity) + noisy_joint_angles = self._apply_noise(info, joint_angles, noise_scales.joint_pos) + noisy_joint_vel = self._apply_noise(info, joint_vel, noise_scales.joint_vel) + noisy_linvel = self._apply_noise(info, linvel, noise_scales.linvel) + state = jp.hstack( + [ + noisy_linvel, + noisy_gyro, + noisy_gravity, + info["command"], + noisy_joint_angles - self._init_q[7:], + noisy_joint_vel, + info["last_act"], + phase, + ] + ) + privileged_state = jp.hstack( + [ + state, + # Unnoised. + gyro, + gravity, + linvel, + joint_angles - self._init_q[7:], + joint_vel, + # Extra. + actuator_torques, + root_pos, + root_quat, + ] + ) + return { + "state": state, + "privileged_state": privileged_state, + } + + def _get_reward( + self, + data: mjx.Data, + action: jax.Array, + info: dict[str, Any], + metrics: dict[str, Any], + done: jax.Array, + ) -> dict[str, jax.Array]: + del metrics # Unused. 
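+    # Unscaled terms: step() multiplies each entry by reward_config.scales[k]
+    # (costs carry negative scales) and by dt before summing.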
+ return { + "termination": done, + "alive": jp.array(1.0) - done, + "tracking": self._reward_tracking(info["command"], info), + "lin_vel_z": self._cost_lin_vel_z(info["filtered_linvel"]), + "ang_vel_xy": self._cost_ang_vel_xy(info["filtered_angvel"]), + "orientation": self._cost_orientation(self.get_gravity(data)), + "feet_phase": self._reward_feet_phase(data, info["phase"]), + "torques": self._cost_torques(data.actuator_force), + "action_rate": self._cost_action_rate(action, info["last_act"]), + "energy": self._cost_energy(data.qvel, data.actuator_force), + "collision": self._cost_collision(data), + "pose": self._cost_pose(data.qpos, info["command"]), + } + + def _reward_tracking(self, commands: jax.Array, info: dict[str, Any]) -> jax.Array: + lin_vel_error = jp.sum(jp.square(commands[:2] - info["filtered_linvel"][:2])) + r_linvel = jp.exp(-lin_vel_error / self._config.reward_config.tracking_sigma) + ang_vel_error = jp.square(commands[2] - info["filtered_angvel"][2]) + r_angvel = jp.exp(-ang_vel_error / self._config.reward_config.tracking_sigma) + return r_linvel + 0.5 * r_angvel + + def _cost_lin_vel_z(self, local_linvel) -> jax.Array: + return jp.square(local_linvel[2]) + + def _cost_ang_vel_xy(self, local_angvel) -> jax.Array: + return jp.sum(jp.square(local_angvel[:2])) + + def _cost_orientation(self, torso_zaxis: jax.Array) -> jax.Array: + return jp.sum(jp.square(torso_zaxis[:2])) + + def _cost_torques(self, torques: jax.Array) -> jax.Array: + return jp.sum(jp.abs(torques)) + + def _cost_energy(self, qvel: jax.Array, qfrc_actuator: jax.Array) -> jax.Array: + torques = qfrc_actuator / self._actuator_torques + return jp.sum(jp.abs(qvel[6:] * torques)) + + def _cost_action_rate(self, act: jax.Array, last_act: jax.Array) -> jax.Array: + return jp.sum(jp.square(act - last_act)) + + def _cost_collision(self, data: mjx.Data) -> jax.Array: + # Hand - thigh. + c = geoms_colliding(data, self._left_hand_geom_id, self._left_thigh_geom_id) + c |= geoms_colliding(data, self._right_hand_geom_id, self._right_thigh_geom_id) + # Foot - foot. + c |= geoms_colliding(data, self._left_foot_geom_id, self._right_foot_geom_id) + # Shin - shin. + c |= geoms_colliding( + data, + self._left_shin_geom_id, + self._right_shin_geom_id, + ) + # Thigh - thigh. + c |= geoms_colliding( + data, + self._left_thigh_geom_id, + self._right_thigh_geom_id, + ) + return jp.any(c) + + def _cost_pose(self, qpos: jax.Array, commands: jax.Array) -> jax.Array: + # Uniform weights when standing still. + weights = jp.where( + jp.linalg.norm(commands) < 0.01, + jp.ones_like(self._weights), + self._weights, + ) + # Reduce hip roll weight when lateral command is high. 
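+    # Indices 21 and 27 index into the 32-entry weight vector from __init__,
+    # where the left and right leg blocks start at 20 and 26, respectively.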
+ lateral_cmd = jp.abs(commands[1]) + hip_roll_weight = jp.where(lateral_cmd > 0.3, 0.01, 1.0) + weights = weights.at[21].set(hip_roll_weight) + weights = weights.at[27].set(hip_roll_weight) + return jp.sum(jp.square(qpos[7:] - self._init_q[7:]) * weights) + + def _reward_feet_phase(self, data: mjx.Data, phase: jax.Array) -> jax.Array: + foot_z = data.site_xpos[self._feet_site_id][..., -1] + rz = gait.get_rz(phase, swing_height=self._config.reward_config.max_foot_height) + error = jp.sum(jp.square(foot_z - rz)) + return jp.exp(-error / 0.01) + + def sample_command(self, rng: jax.Array, x_k: jax.Array) -> jax.Array: + rng, y_rng, w_rng, z_rng = jax.random.split(rng, 4) + y_k = jax.random.uniform( + y_rng, shape=(3,), minval=self._cmd_min, maxval=self._cmd_max + ) + z_k = jax.random.bernoulli(z_rng, self._cmd_zero_prob, shape=(3,)) + w_k = jax.random.bernoulli(w_rng, 0.5, shape=(3,)) + return x_k - w_k * (x_k - y_k * z_k) + + def apply_push(self, state: mjx_env.State) -> mjx_env.State: + state.info["rng"], push1_rng, push2_rng = jax.random.split(state.info["rng"], 3) + push_theta = jax.random.uniform(push1_rng, maxval=2 * jp.pi) + push_magnitude = jax.random.uniform( + push2_rng, + minval=self._config.push_config.magnitude_range[0], + maxval=self._config.push_config.magnitude_range[1], + ) + push = jp.array([jp.cos(push_theta), jp.sin(push_theta)]) + push *= jp.mod(state.info["push_step"] + 1, state.info["push_interval_steps"]) == 0 + push *= self._config.push_config.enable + state.info["push"] = push + state.info["push_step"] += 1 + qvel = state.data.qvel + qvel = qvel.at[:2].set(push * push_magnitude + qvel[:2]) + data = state.data.replace(qvel=qvel) + state = state.replace(data=data) + return state diff --git a/mujoco_playground/_src/locomotion/apollo/xmls/apollo_mjx_feetonly.xml b/mujoco_playground/_src/locomotion/apollo/xmls/apollo_mjx_feetonly.xml new file mode 100644 index 000000000..7ef7d76c0 --- /dev/null +++ b/mujoco_playground/_src/locomotion/apollo/xmls/apollo_mjx_feetonly.xml @@ -0,0 +1,538 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/mujoco_playground/_src/locomotion/apollo/xmls/scene_mjx_feetonly_flat_terrain.xml b/mujoco_playground/_src/locomotion/apollo/xmls/scene_mjx_feetonly_flat_terrain.xml new file mode 100644 index 000000000..2ad479f09 --- /dev/null +++ b/mujoco_playground/_src/locomotion/apollo/xmls/scene_mjx_feetonly_flat_terrain.xml @@ -0,0 +1,60 @@ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/mujoco_playground/config/locomotion_params.py b/mujoco_playground/config/locomotion_params.py index eaa7587d8..cc777a4e1 100644 --- a/mujoco_playground/config/locomotion_params.py +++ 
b/mujoco_playground/config/locomotion_params.py @@ -134,6 +134,19 @@ def brax_ppo_config(env_name: str) -> config_dict.ConfigDict: value_obs_key="privileged_state", ) + elif env_name in ("ApolloJoystickFlatTerrain",): + rl_config.num_timesteps = 200_000_000 + rl_config.num_evals = 20 + rl_config.clipping_epsilon = 0.2 + rl_config.num_resets_per_eval = 1 + rl_config.entropy_cost = 0.005 + rl_config.network_factory = config_dict.create( + policy_hidden_layer_sizes=(512, 256, 128), + value_hidden_layer_sizes=(512, 256, 128), + policy_obs_key="state", + value_obs_key="privileged_state", + ) + elif env_name in ( "BarkourJoystick", "H1InplaceGaitTracking", diff --git a/mujoco_playground/experimental/learning/apollo_joystick.ipynb b/mujoco_playground/experimental/learning/apollo_joystick.ipynb new file mode 100644 index 000000000..a6a405f61 --- /dev/null +++ b/mujoco_playground/experimental/learning/apollo_joystick.ipynb @@ -0,0 +1,301 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import os\n", + "\n", + "xla_flags = os.environ.get(\"XLA_FLAGS\", \"\")\n", + "xla_flags += \" --xla_gpu_triton_gemm_any=True\"\n", + "os.environ[\"XLA_FLAGS\"] = xla_flags\n", + "os.environ[\"XLA_PYTHON_CLIENT_PREALLOCATE\"] = \"false\"\n", + "os.environ[\"MUJOCO_GL\"] = \"egl\"" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "import functools\n", + "import json\n", + "import pickle\n", + "from datetime import datetime\n", + "\n", + "import jax\n", + "import mediapy as media\n", + "import mujoco\n", + "import numpy as np\n", + "from brax.training.agents.ppo import networks as ppo_networks\n", + "from brax.training.agents.ppo import train as ppo\n", + "from etils import epath\n", + "from flax.training import orbax_utils\n", + "from orbax import checkpoint as ocp\n", + "\n", + "from mujoco_playground import registry, wrapper\n", + "from mujoco_playground.config import locomotion_params\n", + "from mujoco_playground.experimental.utils.plotting import TrainingPlotter\n", + "\n", + "# Enable persistent compilation cache.\n", + "jax.config.update(\"jax_compilation_cache_dir\", \"/tmp/jax_cache\")\n", + "jax.config.update(\"jax_persistent_cache_min_entry_size_bytes\", -1)\n", + "jax.config.update(\"jax_persistent_cache_min_compile_time_secs\", 0)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "env_name = \"ApolloJoystickFlatTerrain\"\n", + "env_cfg = registry.get_default_config(env_name)\n", + "randomizer = registry.get_domain_randomizer(env_name)\n", + "ppo_params = locomotion_params.brax_ppo_config(env_name)" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "env_cfg.reward_config.scales.energy = -1e-5\n", + "env_cfg.reward_config.scales.action_rate = -1e-3\n", + "env_cfg.reward_config.scales.torques = 0.0\n", + "\n", + "env_cfg.noise_config.level = 0.0 # 1.0\n", + "env_cfg.push_config.enable = True\n", + "env_cfg.push_config.magnitude_range = [0.1, 2.0]\n", + "\n", + "ppo_params.num_timesteps = 150_000_000\n", + "ppo_params.num_evals = 15" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "SUFFIX = None\n", + "FINETUNE_PATH = None\n", + "\n", + "# Generate unique experiment name.\n", + "now = datetime.now()\n", + "timestamp = now.strftime(\"%Y%m%d-%H%M%S\")\n", + "exp_name = 
f\"{env_name}-{timestamp}\"\n", + "if SUFFIX is not None:\n", + " exp_name += f\"-{SUFFIX}\"\n", + "print(f\"{exp_name}\")\n", + "\n", + "# Possibly restore from the latest checkpoint.\n", + "if FINETUNE_PATH is not None:\n", + " FINETUNE_PATH = epath.Path(FINETUNE_PATH)\n", + " latest_ckpts = list(FINETUNE_PATH.glob(\"*\"))\n", + " latest_ckpts = [ckpt for ckpt in latest_ckpts if ckpt.is_dir()]\n", + " latest_ckpts.sort(key=lambda x: int(x.name))\n", + " latest_ckpt = latest_ckpts[-1]\n", + " restore_checkpoint_path = latest_ckpt\n", + " print(f\"Restoring from: {restore_checkpoint_path}\")\n", + "else:\n", + " restore_checkpoint_path = None" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "ckpt_path = epath.Path(\"checkpoints\").resolve() / exp_name\n", + "ckpt_path.mkdir(parents=True, exist_ok=True)\n", + "print(f\"{ckpt_path}\")\n", + "\n", + "with open(ckpt_path / \"config.json\", \"w\") as fp:\n", + " json.dump(env_cfg.to_json(), fp, indent=4)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "plotter = TrainingPlotter(max_timesteps=ppo_params.num_timesteps, figsize=(15, 10))\n", + "\n", + "\n", + "def progress(num_steps, metrics):\n", + " plotter.update(num_steps, metrics)\n", + "\n", + "\n", + "def policy_params_fn(current_step, make_policy, params):\n", + " del make_policy # Unused.\n", + " orbax_checkpointer = ocp.PyTreeCheckpointer()\n", + " save_args = orbax_utils.save_args_from_target(params)\n", + " path = ckpt_path / f\"{current_step}\"\n", + " orbax_checkpointer.save(path, params, force=True, save_args=save_args)\n", + "\n", + "\n", + "training_params = dict(ppo_params)\n", + "del training_params[\"network_factory\"]\n", + "\n", + "train_fn = functools.partial(\n", + " ppo.train,\n", + " **training_params,\n", + " network_factory=functools.partial(\n", + " ppo_networks.make_ppo_networks, **ppo_params.network_factory\n", + " ),\n", + " restore_checkpoint_path=restore_checkpoint_path,\n", + " progress_fn=progress,\n", + " wrap_env_fn=wrapper.wrap_for_brax_training,\n", + " policy_params_fn=policy_params_fn,\n", + " randomization_fn=randomizer,\n", + ")\n", + "\n", + "env = registry.load(env_name, config=env_cfg)\n", + "eval_env = registry.load(env_name, config=env_cfg)\n", + "make_inference_fn, params, _ = train_fn(environment=env, eval_env=eval_env)\n", + "if len(plotter.times) > 1:\n", + " print(f\"time to jit: {plotter.times[1] - plotter.times[0]}\")\n", + " print(f\"time to train: {plotter.times[-1] - plotter.times[1]}\")" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "inference_fn = make_inference_fn(params, deterministic=True)\n", + "jit_inference_fn = jax.jit(inference_fn)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "# Save normalizer and policy params to the checkpoint dir.\n", + "normalizer_params, policy_params, value_params = params\n", + "with open(ckpt_path / \"params.pkl\", \"wb\") as f:\n", + " data = {\n", + " \"normalizer_params\": normalizer_params,\n", + " \"policy_params\": policy_params,\n", + " \"value_params\": value_params,\n", + " }\n", + " pickle.dump(data, f)" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "from mujoco_playground._src.gait import draw_joystick_command\n", + "\n", + "eval_env = registry.load(env_name, 
config=env_cfg)\n", + "jit_reset = jax.jit(eval_env.reset)\n", + "jit_step = jax.jit(eval_env.step)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "rng = jax.random.PRNGKey(12345)\n", + "rollout = []\n", + "modify_scene_fns = []\n", + "state = jit_reset(rng)\n", + "for i in range(env_cfg.episode_length):\n", + " act_rng, rng = jax.random.split(rng)\n", + " ctrl, _ = jit_inference_fn(state.obs, act_rng)\n", + " state = jit_step(state, ctrl)\n", + " if state.done:\n", + " print(\"something bad happened\")\n", + " break\n", + " rollout.append(state)\n", + " xyz = np.array(state.data.xpos[eval_env.mj_model.body(\"torso_link\").id])\n", + " xyz += np.array([0, 0.0, 0])\n", + " x_axis = state.data.xmat[eval_env._torso_body_id, 0]\n", + " yaw = -np.arctan2(x_axis[1], x_axis[0])\n", + " modify_scene_fns.append(\n", + " functools.partial(\n", + " draw_joystick_command,\n", + " cmd=state.info[\"command\"],\n", + " xyz=xyz,\n", + " theta=yaw,\n", + " scl=np.linalg.norm(state.info[\"command\"]),\n", + " )\n", + " )" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "render_every = 2\n", + "fps = 1.0 / eval_env.dt / render_every\n", + "print(f\"fps: {fps}\")\n", + "traj = rollout[::render_every]\n", + "mod_fns = modify_scene_fns[::render_every]\n", + "\n", + "scene_option = mujoco.MjvOption()\n", + "scene_option.geomgroup[2] = True\n", + "scene_option.geomgroup[3] = False\n", + "scene_option.flags[mujoco.mjtVisFlag.mjVIS_CONTACTPOINT] = True\n", + "scene_option.flags[mujoco.mjtVisFlag.mjVIS_CONTACTFORCE] = False\n", + "scene_option.flags[mujoco.mjtVisFlag.mjVIS_TRANSPARENT] = False\n", + "scene_option.flags[mujoco.mjtVisFlag.mjVIS_PERTFORCE] = False\n", + "\n", + "frames = eval_env.render(\n", + " traj,\n", + " camera=\"track\",\n", + " scene_option=scene_option,\n", + " width=640,\n", + " height=480,\n", + " modify_scene_fns=mod_fns,\n", + ")\n", + "media.show_video(frames, fps=fps, loop=False)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.11" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/mujoco_playground/experimental/sim2sim/onnx/apollo_policy.onnx b/mujoco_playground/experimental/sim2sim/onnx/apollo_policy.onnx new file mode 100644 index 000000000..604e6e78b Binary files /dev/null and b/mujoco_playground/experimental/sim2sim/onnx/apollo_policy.onnx differ diff --git a/mujoco_playground/experimental/sim2sim/play_apollo_joystick.py b/mujoco_playground/experimental/sim2sim/play_apollo_joystick.py new file mode 100644 index 000000000..d879ead9f --- /dev/null +++ b/mujoco_playground/experimental/sim2sim/play_apollo_joystick.py @@ -0,0 +1,142 @@ +# Copyright 2024 DeepMind Technologies Limited +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ==============================================================================
+"""Deploy an MJX policy in ONNX format to C MuJoCo and play with it."""
+
+import mujoco
+import numpy as np
+import onnxruntime as rt
+from etils import epath
+from mujoco import viewer
+
+from mujoco_playground._src.locomotion.apollo import constants as apollo_constants
+from mujoco_playground._src.locomotion.apollo.base import get_assets
+from mujoco_playground.experimental.sim2sim.gamepad_reader import Gamepad
+
+_HERE = epath.Path(__file__).parent
+_ONNX_DIR = _HERE / "onnx"
+
+
+class OnnxController:
+  """ONNX controller for the Apptronik Apollo humanoid."""
+
+  def __init__(
+      self,
+      policy_path: str,
+      default_angles: np.ndarray,
+      ctrl_dt: float,
+      n_substeps: int,
+      action_scale: float = 0.5,
+      vel_scale_x: float = 1.0,
+      vel_scale_y: float = 1.0,
+      vel_scale_rot: float = 1.0,
+  ):
+    self._output_names = ["continuous_actions"]
+    self._policy = rt.InferenceSession(
+        policy_path, providers=["CPUExecutionProvider"]
+    )
+
+    self._action_scale = action_scale
+    self._default_angles = default_angles
+    self._last_action = np.zeros_like(default_angles, dtype=np.float32)
+
+    self._counter = 0
+    self._n_substeps = n_substeps
+    self._ctrl_dt = ctrl_dt
+
+    self._phase = np.array([0.0, np.pi])
+    # Base phase increment per control step; scaled by gait frequency below.
+    self._base_phase_dt = 2 * np.pi * ctrl_dt
+
+    self._joystick = Gamepad(
+        vel_scale_x=vel_scale_x,
+        vel_scale_y=vel_scale_y,
+        vel_scale_rot=vel_scale_rot,
+        deadzone=0.03,
+    )
+
+  def get_obs(self, model, data) -> np.ndarray:
+    linvel = data.sensor("local_linvel").data
+    gyro = data.sensor("gyro").data
+    imu_xmat = data.site_xmat[model.site("imu").id].reshape(3, 3)
+    gravity = imu_xmat.T @ np.array([0, 0, -1])
+    joint_angles = data.qpos[7:] - self._default_angles
+    joint_velocities = data.qvel[6:]
+    command = self._joystick.get_command()
+    ph = self._phase if np.linalg.norm(command) >= 0.01 else np.ones(2) * np.pi
+    phase = np.concatenate([np.cos(ph), np.sin(ph)])
+    obs = np.hstack(
+        [
+            linvel,
+            gyro,
+            gravity,
+            command,
+            joint_angles,
+            joint_velocities,
+            self._last_action,
+            phase,
+        ]
+    )
+    return obs.astype(np.float32)
+
+  def get_control(self, model: mujoco.MjModel, data: mujoco.MjData) -> None:
+    self._counter += 1
+    if self._counter % self._n_substeps == 0:
+      obs = self.get_obs(model, data)
+      onnx_input = {"obs": obs.reshape(1, -1)}
+      onnx_pred = self._policy.run(self._output_names, onnx_input)[0][0]
+      self._last_action = onnx_pred.copy()
+      data.ctrl[:] = onnx_pred * self._action_scale + self._default_angles
+      command = self._joystick.get_command()
+      cmd_magnitude = np.linalg.norm(command)
+      if cmd_magnitude < 0.01:
+        gait_freq = 1.25
+      else:
+        gait_freq = 1.25 + 0.5 * min(cmd_magnitude, 1.5) / 1.5
+      phase_dt = self._base_phase_dt * gait_freq
+      phase_tp1 = self._phase + phase_dt
+      self._phase = np.fmod(phase_tp1 + np.pi, 2 * np.pi) - np.pi
+
+
+def load_callback(model=None, data=None):
+  mujoco.set_mjcb_control(None)
+
+  model = mujoco.MjModel.from_xml_path(
+      apollo_constants.FEET_ONLY_FLAT_TERRAIN_XML.as_posix(),
+      assets=get_assets(),
+  )
+  data = 
mujoco.MjData(model) + + mujoco.mj_resetDataKeyframe(model, data, 0) + + ctrl_dt = 0.02 + sim_dt = 0.005 + n_substeps = int(round(ctrl_dt / sim_dt)) + model.opt.timestep = sim_dt + + policy = OnnxController( + policy_path=(_ONNX_DIR / "apollo_policy.onnx").as_posix(), + default_angles=np.array(model.keyframe("knees_bent").qpos[7:]), + ctrl_dt=ctrl_dt, + n_substeps=n_substeps, + action_scale=0.5, + vel_scale_x=1.5, + vel_scale_y=0.8, + vel_scale_rot=1.5, + ) + + mujoco.set_mjcb_control(policy.get_control) + + return model, data + + +if __name__ == "__main__": + viewer.launch(loader=load_callback) diff --git a/mujoco_playground/experimental/utils/plotting.py b/mujoco_playground/experimental/utils/plotting.py new file mode 100644 index 000000000..be7809abb --- /dev/null +++ b/mujoco_playground/experimental/utils/plotting.py @@ -0,0 +1,337 @@ +# Copyright 2024 DeepMind Technologies Limited +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================== +from datetime import datetime +from typing import Any, Dict, List, Tuple + +import matplotlib.pyplot as plt +import numpy as np +from IPython.display import clear_output, display + + +class TrainingPlotter: + def __init__( + self, + max_timesteps: int = 50_000_000, + figsize: Tuple[int, int] = (12, 8), + max_cols: int = 3, + ): + self.max_timesteps = max_timesteps + self.max_cols = max_cols + + # Default main metrics that we always want to plot. 
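+        # Per-term reward/error/termination metrics are discovered from the
+        # first metrics dict in _initialize_metrics and plotted alongside.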
+ self.default_metrics = [ + "eval/episode_reward", + "eval/avg_episode_length", + "steps_per_second", + ] + + self.metrics = [] + self.metrics_std = [] + self.metric_labels = [] + self.error_metrics = [] + self.error_metrics_std = [] + self.error_metric_labels = [] + self.reward_detail_metrics = [] + self.reward_detail_metrics_std = [] + self.reward_detail_metric_labels = [] + self.termination_metrics = [] + self.termination_metrics_std = [] + self.termination_metric_labels = [] + + self.x_data = [] + self.times = [datetime.now()] + self.metrics_data = {} + self.metrics_std_data = {} + + self.fps_data = [] # Store calculated steps per second + + # Use default matplotlib style + plt.rcParams["axes.grid"] = False + plt.rcParams["axes.edgecolor"] = "#888888" + plt.rcParams["axes.linewidth"] = 0.8 + + # Create initial figure and axes - we'll resize this later + n_cols = min(self.max_cols, 1) # Start with at least 1 column, but respect max_cols + n_rows = 1 + self.fig, self.axes = plt.subplots(n_rows, n_cols, figsize=figsize) + self.axes = np.array([[self.axes]]) + + # Set figure background to white for clean look + self.fig.patch.set_facecolor("white") + + # Set up the layout with reasonable spacing + plt.tight_layout(pad=2.5, h_pad=1.5, w_pad=1.0) + + def _get_label_from_metric(self, metric: str) -> str: + parts = metric.split("/") + if len(parts) > 1: + label = parts[-1] + else: + label = metric + if label == "episode_reward": + return "reward_per_episode" + elif label == "avg_episode_length": + return "episode_length" + elif label == "steps_per_second": + return "steps_per_second" + else: + return label + + def _initialize_metrics(self, metrics: Dict[str, Any]) -> None: + """Initialize all metrics from the first metrics dictionary.""" + # Start with default metrics + self.metrics = self.default_metrics.copy() + self.metrics_std = [f"{m}_std" for m in self.metrics] + self.metric_labels = [self._get_label_from_metric(m) for m in self.metrics] + + # Initialize data storage for default metrics + for metric in self.metrics: + self.metrics_data[metric] = [] + for metric_std in self.metrics_std: + self.metrics_std_data[metric_std] = [] + + # Find all reward detail metrics (eval/episode_reward/*) + reward_prefix = "eval/episode_reward/" + for key in metrics: + if ( + key.startswith(reward_prefix) + and not key.endswith("_std") + and key != "eval/episode_reward" + ): + self.reward_detail_metrics.append(key) + self.reward_detail_metrics_std.append(f"{key}_std") + label = key[len(reward_prefix) :] + self.reward_detail_metric_labels.append(label) # Keep underscores + + # Initialize data storage + self.metrics_data[key] = [] + self.metrics_std_data[f"{key}_std"] = [] + + # Find all error metrics (eval/episode_error/*) + error_prefix = "eval/episode_error/" + for key in metrics: + if key.startswith(error_prefix) and not key.endswith("_std"): + self.error_metrics.append(key) + self.error_metrics_std.append(f"{key}_std") + label = key[len(error_prefix) :] + self.error_metric_labels.append(label) # Keep underscores + + # Initialize data storage + self.metrics_data[key] = [] + self.metrics_std_data[f"{key}_std"] = [] + + # Find all termination metrics (eval/episode_termination/*) + termination_prefix = "eval/episode_termination/" + for key in metrics: + if key.startswith(termination_prefix) and not key.endswith("_std"): + self.termination_metrics.append(key) + self.termination_metrics_std.append(f"{key}_std") + label = key[len(termination_prefix) :] + self.termination_metric_labels.append(label) # Keep 
underscores + + # Initialize data storage + self.metrics_data[key] = [] + self.metrics_std_data[f"{key}_std"] = [] + + def update(self, num_steps: int, metrics: Dict[str, float]) -> None: + self.x_data.append(num_steps) + current_time = datetime.now() + self.times.append(current_time) + + # Calculate steps per second if we have at least two data points + if len(self.x_data) > 1: + time_diff = (current_time - self.times[-2]).total_seconds() + steps_diff = self.x_data[-1] - self.x_data[-2] + if time_diff > 0: + fps = steps_diff / time_diff + else: + fps = 0 + self.fps_data.append(fps) + else: + self.fps_data.append(0) # First point has no previous data to compare + + # Initialize metrics if this is the first update. + if len(self.x_data) == 1: + self._initialize_metrics(metrics) + # Add fps to metrics data structure + self.metrics_data["steps_per_second"] = [] + self.metrics_std_data["steps_per_second_std"] = [] + + # Update all metrics data. + all_metrics = ( + self.metrics + + self.reward_detail_metrics + + self.error_metrics + + self.termination_metrics + ) + all_metrics_std = ( + self.metrics_std + + self.reward_detail_metrics_std + + self.error_metrics_std + + self.termination_metrics_std + ) + + for metric in all_metrics: + if metric == "steps_per_second": + self.metrics_data[metric].append(self.fps_data[-1]) + elif metric in metrics: + self.metrics_data[metric].append(metrics[metric]) + else: + last_value = self.metrics_data[metric][-1] if self.metrics_data[metric] else 0 + self.metrics_data[metric].append(last_value) + + for metric_std in all_metrics_std: + if metric_std in metrics: + self.metrics_std_data[metric_std].append(metrics[metric_std]) + else: + last_value = ( + self.metrics_std_data[metric_std][-1] + if self.metrics_std_data[metric_std] + else 0 + ) + self.metrics_std_data[metric_std].append(last_value) + + clear_output(wait=True) + + # Combine all metrics for plotting. + all_metrics = ( + self.metrics + + self.reward_detail_metrics + + self.error_metrics + + self.termination_metrics + ) + all_metrics_std = ( + self.metrics_std + + self.reward_detail_metrics_std + + self.error_metrics_std + + self.termination_metrics_std + ) + all_labels = ( + self.metric_labels + + self.reward_detail_metric_labels + + self.error_metric_labels + + self.termination_metric_labels + ) + + # Calculate grid dimensions using max_cols. + total_plots = len(all_metrics) + n_cols = min(self.max_cols, total_plots) # Use max_cols parameter. + n_rows = (total_plots + n_cols - 1) // n_cols # Ceiling division. + + # Check if we need to resize the axes grid + if n_rows > self.axes.shape[0] or n_cols > self.axes.shape[1]: + plt.close(self.fig) + # Calculate a better figure size based on the number of plots and columns + width = max(12, n_cols * 3.5) # 3.5 inches per column + height = max(8, n_rows * 2.5) # 2.5 inches per row + self.fig, self.axes = plt.subplots(n_rows, n_cols, figsize=(width, height)) + + # Handle case where there's only one plot. + if n_rows == 1 and n_cols == 1: + self.axes = np.array([[self.axes]]) + elif n_rows == 1: + self.axes = np.array([self.axes]) + elif n_cols == 1: + self.axes = np.array([[ax] for ax in self.axes]) + + # Plot all metrics + self._plot_metrics(all_metrics, all_metrics_std, all_labels, self.axes) + + # Add a single x-axis label at the bottom of the figure. + self.fig.text( + 0.5, 0.01, "# environment steps", ha="center", fontsize=12, fontweight="bold" + ) + + # Update layout and display. 
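+        # Re-run tight_layout on every update since the subplot grid may have
+        # been resized above when new metric panels appeared.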
+ self.fig.tight_layout(pad=2.5, h_pad=1.5, w_pad=1.0) + self.fig.subplots_adjust(bottom=0.08) + display(self.fig) + + def _plot_metrics( + self, + metrics_list: List[str], + metrics_std_list: List[str], + labels_list: List[str], + axes_grid: np.ndarray, + ) -> None: + """Plot a set of metrics on the given axes grid.""" + for i, (metric, metric_std, label) in enumerate( + zip(metrics_list, metrics_std_list, labels_list) + ): + row, col = i // axes_grid.shape[1], i % axes_grid.shape[1] + if row < axes_grid.shape[0] and col < axes_grid.shape[1]: + ax = axes_grid[row][col] + ax.clear() + ax.set_xlim([0, self.max_timesteps * 1.25]) + + # Remove x-axis labels from all subplots + ax.set_xlabel("") + + # Make tick labels smaller to save space + ax.tick_params(axis="both", which="major", labelsize=9) + + # Add subtle grid for better readability + ax.grid(True, linestyle="-", linewidth=0.5, alpha=0.2) + + # Clean background + ax.set_facecolor("white") + + # Format y-axis with fewer decimal places for cleaner look + ax.ticklabel_format(axis="y", style="plain", useOffset=False) + + y_values = self.metrics_data[metric] + yerr_values = ( + self.metrics_std_data[metric_std] + if metric_std in self.metrics_std_data + else None + ) + + if y_values: + # Add prefix based on metric type + prefix = "" + if "eval/episode_error/" in metric: + prefix = "error/" + elif "eval/episode_reward/" in metric: + prefix = "reward/" + elif "eval/episode_termination/" in metric: + prefix = "termination/" + + # Use smaller font for title to save space + ax.set_title( + f"{prefix}{label}: {y_values[-1]:.3f}", fontsize=10, fontweight="bold" + ) + + # Plot the line with improved styling + line = ax.errorbar( + self.x_data, + y_values, + yerr=yerr_values, + color="black", + linewidth=1.5, + elinewidth=0.7, + capsize=2, + ) + + # Add very subtle shading under the curve for better visibility + ax.fill_between(self.x_data, 0, y_values, alpha=0.05, color="black") + + # Hide unused subplots + for i in range(len(metrics_list), axes_grid.shape[0] * axes_grid.shape[1]): + row, col = i // axes_grid.shape[1], i % axes_grid.shape[1] + if row < axes_grid.shape[0] and col < axes_grid.shape[1]: + axes_grid[row][col].set_visible(False) + + def save_figure(self, filename: str) -> None: + self.fig.savefig(filename, dpi=300, bbox_inches="tight")
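As a quick sanity check of the new registration, a minimal sketch like the
following (not part of the diff; it assumes mujoco_playground is installed)
loads "ApolloJoystickFlatTerrain" from the registry and rolls it forward with
zero actions:

import jax
import jax.numpy as jp

from mujoco_playground import registry

# Load the environment registered in locomotion/__init__.py.
env = registry.load("ApolloJoystickFlatTerrain")

# Reset, then take a few control steps with zero actions.
state = jax.jit(env.reset)(jax.random.PRNGKey(0))
step = jax.jit(env.step)
for _ in range(10):
  state = step(state, jp.zeros(env.action_size))

print(state.obs["state"].shape, float(state.reward), float(state.done))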