From 4b5fcb4d6753534edaa861694f65e17f8b462edc Mon Sep 17 00:00:00 2001
From: yuanhaonan <yuanhaonan@dexforce.top>
Date: Mon, 25 May 2026 10:55:42 +0800
Subject: [PATCH 1/4] standardize lerobot key

---
 docs/source/overview/gym/dataset_functors.md  |  8 ++--
 docs/source/tutorial/data_generation.rst      |  2 +-
 embodichain/data/enum.py                      | 25 +++++++++++++
 embodichain/lab/gym/envs/managers/datasets.py | 37 +++++++------------
 .../envs/managers/test_dataset_functors.py    | 19 +++++-----
 5 files changed, 51 insertions(+), 40 deletions(-)

diff --git a/docs/source/overview/gym/dataset_functors.md b/docs/source/overview/gym/dataset_functors.md
index c043ee68..92fc71cb 100644
--- a/docs/source/overview/gym/dataset_functors.md
+++ b/docs/source/overview/gym/dataset_functors.md
@@ -73,12 +73,10 @@ The ``LeRobotRecorder`` functor enables recording robot learning episodes in the
 
 The LeRobotRecorder saves the following data for each frame:
 
-- ``observation.qpos``: Joint positions
-- ``observation.qvel``: Joint velocities
-- ``observation.qf``: Joint forces/torques
+- ``observation.state``: Joint positions (proprioceptive state)
 - ``action``: Applied action
-- ``{sensor_name}.color``: Camera images (if sensors present)
-- ``{sensor_name}.color_right``: Right camera images (for stereo cameras)
+- ``observation.images.{sensor_name}``: Camera images (if sensors present)
+- ``observation.images.{sensor_name}_right``: Right camera images (for stereo cameras)
 
 ## Usage Example
 
diff --git a/docs/source/tutorial/data_generation.rst b/docs/source/tutorial/data_generation.rst
index ca994f3d..741241e8 100644
--- a/docs/source/tutorial/data_generation.rst
+++ b/docs/source/tutorial/data_generation.rst
@@ -83,7 +83,7 @@ Important parameters are:
 - **env.control_parts**: Controlled robot parts in the environment.
 
 
-In the current implementation, ``LeRobotRecorder`` stores robot state and action features such as ``observation.qpos``, ``observation.qvel``, ``observation.qf``, ``action``, and camera images when sensors are present.
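+In the current implementation, ``LeRobotRecorder`` stores robot state and action features following the official LeRobot format: ``observation.state`` for joint positions, ``action`` for applied actions, and ``observation.images.{sensor_name}`` for camera images when sensors are present. Joint velocities and joint forces are additionally stored under the non-standard keys ``observation.qvel`` and ``observation.qf``.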
 
 Step 2: Prepare the Action Configuration
 ----------------------------------------
diff --git a/embodichain/data/enum.py b/embodichain/data/enum.py
index 2902045c..78f32fe5 100644
--- a/embodichain/data/enum.py
+++ b/embodichain/data/enum.py
@@ -74,3 +74,28 @@ class EefType(Enum):
 class ActionMode(Enum):
     ABSOLUTE = ""
     RELATIVE = "delta_"  # This indicates the action is relative change with respect to last state.
+
+
+class LeRobotKey(Enum):
+    """LeRobot standard field keys - official LeRobot dataset format."""
+
+    OBS_STR = "observation"
+    OBS_PREFIX = "observation."
+    OBS_ENV_STATE = "observation.environment_state"
+    OBS_STATE = "observation.state"
+    OBS_IMAGE = "observation.image"
+    OBS_IMAGES = "observation.images"
+    OBS_LANGUAGE = "observation.language"
+    OBS_LANGUAGE_TOKENS = "observation.language.tokens"
+    OBS_LANGUAGE_ATTENTION_MASK = "observation.language.attention_mask"
+    OBS_LANGUAGE_SUBTASK = "observation.subtask"
+    OBS_LANGUAGE_SUBTASK_TOKENS = "observation.subtask.tokens"
+    OBS_LANGUAGE_SUBTASK_ATTENTION_MASK = "observation.subtask.attention_mask"
+    ACTION = "action"
+    ACTION_PREFIX = "action."
+    ACTION_TOKENS = "action.tokens"
+    ACTION_TOKEN_MASK = "action.token_mask"
+    REWARD = "next.reward"
+    TRUNCATED = "next.truncated"
+    DONE = "next.done"
+    INFO = "info"
diff --git a/embodichain/lab/gym/envs/managers/datasets.py b/embodichain/lab/gym/envs/managers/datasets.py
index 005eb699..f84f5875 100644
--- a/embodichain/lab/gym/envs/managers/datasets.py
+++ b/embodichain/lab/gym/envs/managers/datasets.py
@@ -30,6 +30,7 @@
 
 from embodichain.utils import logger
 from embodichain.data.constants import EMBODICHAIN_DEFAULT_DATASET_ROOT
+from embodichain.data.enum import LeRobotKey
 from embodichain.lab.gym.utils.misc import is_stereocam
 from embodichain.lab.sim.sensors import Camera, ContactSensor
 from .manager_base import Functor
@@ -275,17 +276,7 @@ def _build_features(self) -> Dict:
             self._env.robot.joint_names[i] for i in self._env.active_joint_ids
         ]
 
-        features["observation.qpos"] = {
-            "dtype": "float32",
-            "shape": (state_dim,),
-            "names": joint_names,
-        }
-        features["observation.qvel"] = {
-            "dtype": "float32",
-            "shape": (state_dim,),
-            "names": joint_names,
-        }
-        features["observation.qf"] = {
+        features[LeRobotKey.OBS_STATE.value] = {
             "dtype": "float32",
             "shape": (state_dim,),
             "names": joint_names,
@@ -293,7 +284,7 @@ def _build_features(self) -> Dict:
 
         # Use full qpos dimension for action (includes gripper)
         action_dim = state_dim
-        features["action"] = {
+        features[LeRobotKey.ACTION.value] = {
             "dtype": "float32",
             "shape": (action_dim,),
             "names": joint_names,
@@ -316,14 +307,14 @@ def _build_features(self) -> Dict:
                                 f"Only support 'color' frame for vision sensors, but got '{frame_name}' in sensor '{sensor_name}'"
                             )
 
-                        features[f"{sensor_name}.{frame_name}"] = {
+                        features[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}"] = {
                             "dtype": "video" if self.use_videos else "image",
                             "shape": (sensor.cfg.height, sensor.cfg.width, 3),
                             "names": ["height", "width", "channel"],
                         }
 
                         if is_stereo:
-                            features[f"{sensor_name}.{frame_name}_right"] = {
+                            features[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}_right"] = {
                                 "dtype": "video" if self.use_videos else "image",
                                 "shape": (sensor.cfg.height, sensor.cfg.width, 3),
                                 "names": ["height", "width", "channel"],
@@ -379,7 +370,7 @@ def _add_nested_features(
                 # Recursively handle deeper nesting
                 self._add_nested_features(features, f"{key}.{sub_key}", sub_space)
             else:
-                feature_name = f"observation.{key}.{sub_key}"
+                feature_name = f"{LeRobotKey.OBS_PREFIX.value}{key}.{sub_key}"
                 # Handle empty shapes for scalar values (e.g., mass, friction, damping)
                 # LeRobot requires non-empty shapes, so convert () to (1,)
                 shape = sub_space.shape if sub_space.shape else (1,)
@@ -463,12 +454,12 @@ def _convert_frame_to_lerobot(
 
                     color_data = obs["sensor"][sensor_name]["color"]
                     color_img = color_data[:, :, :3].cpu()
-                    frame[f"{sensor_name}.color"] = color_img
+                    frame[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}"] = color_img
 
                     if is_stereo:
                         color_right_data = obs["sensor"][sensor_name]["color_right"]
                         color_right_img = color_right_data[:, :, :3].cpu()
-                        frame[f"{sensor_name}.color_right"] = color_right_img
+                        frame[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}_right"] = color_right_img
                 elif isinstance(sensor, ContactSensor):
                     for frame_name in value.keys():
                         frame[f"{sensor_name}.{frame_name}"] = obs["sensor"][
@@ -481,10 +472,8 @@ def _convert_frame_to_lerobot(
                         f"Unsupported sensor type for '{sensor_name}' when converting to LeRobot format. Currently only support Camera and ContactSensor."
                     )
 
-        # Add state
-        frame["observation.qpos"] = obs["robot"]["qpos"].cpu()
-        frame["observation.qvel"] = obs["robot"]["qvel"].cpu()
-        frame["observation.qf"] = obs["robot"]["qf"].cpu()
+        # Add state (use LeRobot standard key "observation.state")
+        frame[LeRobotKey.OBS_STATE.value] = obs["robot"]["qpos"].cpu()
 
         # Add extra observation features if they exist
         for key in obs.keys():
@@ -516,7 +505,7 @@ def _convert_frame_to_lerobot(
             if isinstance(action_tensor, torch.Tensor):
                 action_data = action_tensor.cpu()
 
-        frame["action"] = action_data
+        frame[LeRobotKey.ACTION.value] = action_data
 
         return frame
 
@@ -548,7 +537,7 @@ def _add_nested_obs_to_frame(
                 # Handle 0D tensors (scalars) - convert to 1D for LeRobot compatibility
                 if isinstance(value, torch.Tensor) and value.ndim == 0:
                     value = value.unsqueeze(0)
-                frame[f"observation.{key}.{sub_key}"] = value
+                frame[f"{LeRobotKey.OBS_PREFIX.value}{key}.{sub_key}"] = value
 
     def _update_dataset_info(self, updates: dict) -> bool:
         """Update dataset metadata."""
@@ -561,4 +550,4 @@ def _update_dataset_info(self, updates: dict) -> bool:
             return True
         except Exception as e:
             logger.log_error(f"Failed to update dataset info: {e}")
-            return False
+            return False
\ No newline at end of file
diff --git a/tests/gym/envs/managers/test_dataset_functors.py b/tests/gym/envs/managers/test_dataset_functors.py
index 1acd54b6..fe416eb4 100644
--- a/tests/gym/envs/managers/test_dataset_functors.py
+++ b/tests/gym/envs/managers/test_dataset_functors.py
@@ -29,13 +29,15 @@
         LEROBOT_AVAILABLE,
     )
 
+    from embodichain.data.enum import LeRobotKey
     LEROBOT_AVAILABLE = True
 except ImportError:
     LEROBOT_AVAILABLE = False
     LeRobotRecorder = None
-
+    LeRobotKey = None
 
 # Import Camera for mocking (only if available)
+
 try:
     from embodichain.lab.sim.sensors import Camera
 
@@ -228,15 +230,12 @@ def test_build_features_creates_correct_structure(self, mock_lerobot_dataset):
         # Access the private method through the instance
         features = recorder._build_features()
 
-        # Check expected features exist
-        assert "observation.qpos" in features
-        assert "observation.qvel" in features
-        assert "observation.qf" in features
-        assert "action" in features
+        assert LeRobotKey.OBS_STATE.value in features
+        assert LeRobotKey.ACTION.value in features
 
         # Check shapes
-        assert features["observation.qpos"]["shape"] == (6,)
-        assert features["action"]["shape"] == (6,)
+        assert features[LeRobotKey.OBS_STATE.value]["shape"] == (6,)
+        assert features[LeRobotKey.ACTION.value]["shape"] == (6,)
 
     @patch("embodichain.lab.gym.envs.managers.datasets.LeRobotDataset")
     def test_build_features_with_sensor(self, mock_lerobot_dataset):
@@ -328,8 +327,8 @@ def test_convert_frame_with_tensor_action(self, mock_lerobot_dataset):
 
         assert "task" in frame
         assert frame["task"] == "test_task"
-        assert "observation.qpos" in frame
-        assert "action" in frame
+        assert LeRobotKey.OBS_STATE.value in frame
+        assert LeRobotKey.ACTION.value in frame
 
 
 class TestDatasetFunctorCfg:

From 3608353fb502733ab933a091fcbe4b3c8540ebb9 Mon Sep 17 00:00:00 2001
From: yuanhaonan <yuanhaonan@dexforce.top>
Date: Mon, 25 May 2026 14:17:33 +0800
Subject: [PATCH 2/4] black

---
 embodichain/lab/gym/envs/managers/datasets.py    | 10 +++++++---
 tests/gym/envs/managers/test_dataset_functors.py |  1 +
 2 files changed, 8 insertions(+), 3 deletions(-)

diff --git a/embodichain/lab/gym/envs/managers/datasets.py b/embodichain/lab/gym/envs/managers/datasets.py
index f84f5875..7fd0004d 100644
--- a/embodichain/lab/gym/envs/managers/datasets.py
+++ b/embodichain/lab/gym/envs/managers/datasets.py
@@ -314,7 +314,9 @@ def _build_features(self) -> Dict:
                         }
 
                         if is_stereo:
-                            features[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}_right"] = {
+                            features[
+                                f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}_right"
+                            ] = {
                                 "dtype": "video" if self.use_videos else "image",
                                 "shape": (sensor.cfg.height, sensor.cfg.width, 3),
                                 "names": ["height", "width", "channel"],
@@ -459,7 +461,9 @@ def _convert_frame_to_lerobot(
                     if is_stereo:
                         color_right_data = obs["sensor"][sensor_name]["color_right"]
                         color_right_img = color_right_data[:, :, :3].cpu()
-                        frame[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}_right"] = color_right_img
+                        frame[f"{LeRobotKey.OBS_IMAGES.value}.{sensor_name}_right"] = (
+                            color_right_img
+                        )
                 elif isinstance(sensor, ContactSensor):
                     for frame_name in value.keys():
                         frame[f"{sensor_name}.{frame_name}"] = obs["sensor"][
@@ -550,4 +554,4 @@ def _update_dataset_info(self, updates: dict) -> bool:
             return True
         except Exception as e:
             logger.log_error(f"Failed to update dataset info: {e}")
-            return False
\ No newline at end of file
+            return False
diff --git a/tests/gym/envs/managers/test_dataset_functors.py b/tests/gym/envs/managers/test_dataset_functors.py
index fe416eb4..3a782048 100644
--- a/tests/gym/envs/managers/test_dataset_functors.py
+++ b/tests/gym/envs/managers/test_dataset_functors.py
@@ -30,6 +30,7 @@
     )
 
     from embodichain.data.enum import LeRobotKey
+
     LEROBOT_AVAILABLE = True
 except ImportError:
     LEROBOT_AVAILABLE = False

From 1161e1e07bcfb494a6a86cfadc46b719768e83c8 Mon Sep 17 00:00:00 2001
From: yuanhaonan <yuanhaonan@dexforce.top>
Date: Mon, 25 May 2026 14:49:00 +0800
Subject: [PATCH 3/4] add observation qvel qf

---
 embodichain/data/enum.py                      |  2 ++
 embodichain/lab/gym/envs/managers/datasets.py | 13 +++++++++++++
 2 files changed, 15 insertions(+)

diff --git a/embodichain/data/enum.py b/embodichain/data/enum.py
index 78f32fe5..145fa71a 100644
--- a/embodichain/data/enum.py
+++ b/embodichain/data/enum.py
@@ -83,6 +83,8 @@ class LeRobotKey(Enum):
     OBS_PREFIX = "observation."
     OBS_ENV_STATE = "observation.environment_state"
     OBS_STATE = "observation.state"
+    OBS_QVEL = "observation.qvel"
+    OBS_QF = "observation.qf"
     OBS_IMAGE = "observation.image"
     OBS_IMAGES = "observation.images"
     OBS_LANGUAGE = "observation.language"
diff --git a/embodichain/lab/gym/envs/managers/datasets.py b/embodichain/lab/gym/envs/managers/datasets.py
index 7fd0004d..796fef09 100644
--- a/embodichain/lab/gym/envs/managers/datasets.py
+++ b/embodichain/lab/gym/envs/managers/datasets.py
@@ -281,6 +281,16 @@ def _build_features(self) -> Dict:
             "shape": (state_dim,),
             "names": joint_names,
         }
+        features[LeRobotKey.OBS_QVEL.value] = {
+            "dtype": "float32",
+            "shape": (state_dim,),
+            "names": joint_names,
+        }
+        features[LeRobotKey.OBS_QF.value] = {
+            "dtype": "float32",
+            "shape": (state_dim,),
+            "names": joint_names,
+        }
 
         # Use full qpos dimension for action (includes gripper)
         action_dim = state_dim
@@ -478,6 +488,9 @@ def _convert_frame_to_lerobot(
 
         # Add state (use LeRobot standard key "observation.state")
         frame[LeRobotKey.OBS_STATE.value] = obs["robot"]["qpos"].cpu()
+        # Also keep joint velocities (qvel) and joint forces (qf): useful proprioceptive data, although these keys are not part of the official LeRobot format
+        frame[LeRobotKey.OBS_QVEL.value] = obs["robot"]["qvel"].cpu()
+        frame[LeRobotKey.OBS_QF.value] = obs["robot"]["qf"].cpu()
 
         # Add extra observation features if they exist
         for key in obs.keys():

From 6df55c17842e17db7fb4446a92629b68741bff56 Mon Sep 17 00:00:00 2001
From: yuanhaonan <yuanhaonan@dexforce.top>
Date: Mon, 25 May 2026 17:19:17 +0800
Subject: [PATCH 4/4] fix unittest

---
 tests/gym/envs/managers/test_dataset_functors.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/tests/gym/envs/managers/test_dataset_functors.py b/tests/gym/envs/managers/test_dataset_functors.py
index 3a782048..41d5bf89 100644
--- a/tests/gym/envs/managers/test_dataset_functors.py
+++ b/tests/gym/envs/managers/test_dataset_functors.py
@@ -276,8 +276,8 @@ def mock_isinstance(obj, class_or_tuple):
             recorder = LeRobotRecorder(cfg, env)
             features = recorder._build_features()
 
-        # Check camera feature exists
-        assert "camera.color" in features
+        # Check camera feature exists (use LeRobot standard key format)
+        assert f"{LeRobotKey.OBS_IMAGES.value}.camera" in features
 
 
 @pytest.mark.skipif(not LEROBOT_AVAILABLE, reason="LeRobot not installed")