add dataset collection node

8 months ago · 1388c5249c
--- a/examples/lerobot-dataset-record/dataflow.yml
+++ b/examples/lerobot-dataset-record/dataflow.yml
@@ -0,0 +1,88 @@
 nodes:
  - id: laptop_cam
    build: pip install opencv-video-capture
    path: opencv-video-capture
    inputs:
      tick: dora/timer/millis/33
    outputs:
      - image
    env:
      CAPTURE_PATH: "0"
      ENCODING: "rgb8"
      IMAGE_WIDTH: "640"
      IMAGE_HEIGHT: "480"

  - id: front_cam
    build: pip install opencv-video-capture
    path: opencv-video-capture
    inputs:
      tick: dora/timer/millis/33
    outputs:
      - image
    env:
      CAPTURE_PATH: "2"
      ENCODING: "rgb8"
      IMAGE_WIDTH: "640"
      IMAGE_HEIGHT: "480"

  - id: so101
    build: pip install -e ../../node-hub/dora-rustypot
    path: dora-rustypot
    inputs:
      tick: dora/timer/millis/10
      pose: leader_interface/pose
    outputs:
      - pose
    env:
      PORT: "/dev/ttyACM1"
      IDS: "1,2,3,4,5,6"

  - id: leader_interface
    path: dora-rustypot
    build: pip install -e ../../node-hub/dora-rustypot
    inputs:
      tick: dora/timer/millis/10
    outputs:
      - pose
    env:
      PORT: "/dev/ttyACM0"
      IDS: "1,2,3,4,5,6"

  - id: lerobot_recorder
    build: pip install -e ../../node-hub/dora-dataset-record
    path: dora-dataset-record
    inputs:
      laptop: laptop_cam/image
      front: front_cam/image
      robot_state: so101/pose
      robot_action: leader_interface/pose
    outputs:
      - text
    env:
      REPO_ID: "HF_username/name_of_dataset"
      SINGLE_TASK: "Pick up the cube and place it in the box"
      ROBOT_TYPE: "your robot type" # e.g., "so101_follower", "ur5e" etc

      FPS: "30"
      TOTAL_EPISODES: "5"
      EPISODE_DURATION_S: "60"
      RESET_DURATION_S: "15"
      
      CAMERA_NAMES: "laptop, front"
      CAMERA_LAPTOP_RESOLUTION: "480,640,3"
      CAMERA_FRONT_RESOLUTION: "480,640,3"
      ROBOT_JOINTS: "shoulder_pan.pos,shoulder_lift.pos,elbow_flex.pos,wrist_flex.pos,wrist_roll.pos,gripper.pos"

      # ROOT_PATH: "path where you want to save the dataset" # if not set, will save to ~/.cache/huggingface/lerobot
      USE_VIDEOS: "true"
      PUSH_TO_HUB: "false"
      PRIVATE: "false"
      TAGS: "robotics, manipulation"

  - id: plot
    build: pip install dora-rerun
    path: dora-rerun
    inputs:
      image_laptop: laptop_cam/image
      image_front: front_cam/image
      text: lerobot_recorder/text
--- a/node-hub/dora-dataset-record/README.md
+++ b/node-hub/dora-dataset-record/README.md
@@ -0,0 +1,40 @@
 # dora-dataset-record

 ## Getting started

 - Install it with uv:

 ```bash
 uv venv -p 3.11 --seed
 uv pip install -e .
 ```

 ## Contribution Guide

 - Format with [ruff](https://docs.astral.sh/ruff/):

 ```bash
 uv pip install ruff
 uv run ruff check . --fix
 ```

 - Lint with ruff:

 ```bash
 uv run ruff check .
 ```

 - Test with [pytest](https://github.com/pytest-dev/pytest)

 ```bash
 uv pip install pytest
 uv run pytest . # Test
 ```

 ## YAML Specification

 ## Examples

 ## License

 dora-dataset-record's code is released under the MIT License.
--- a/node-hub/dora-dataset-record/dora_dataset_record/__init__.py
+++ b/node-hub/dora-dataset-record/dora_dataset_record/__init__.py
@@ -0,0 +1,11 @@
 import os

 # The README lives one directory above this package's directory
 readme_path = os.path.join(
    os.path.dirname(os.path.dirname(__file__)),
    "README.md",
 )

 # Use the README text as the module docstring, with a fallback when absent
 try:
    f = open(readme_path, encoding="utf-8")
 except FileNotFoundError:
    __doc__ = "README file not found."
 else:
    with f:
        __doc__ = f.read()
--- a/node-hub/dora-dataset-record/dora_dataset_record/__main__.py
+++ b/node-hub/dora-dataset-record/dora_dataset_record/__main__.py
@@ -0,0 +1,5 @@
 # Re-use the entry point defined in the sibling ``main`` module
 from .main import main


 # Run the recorder entry point only when this module is executed as a script
 if __name__ == "__main__":
    main()
--- a/node-hub/dora-dataset-record/dora_dataset_record/main.py
+++ b/node-hub/dora-dataset-record/dora_dataset_record/main.py
@@ -0,0 +1,348 @@
 """TODO: Add docstring."""

 from dora import Node
 import pyarrow as pa
 import os
 import time
 import numpy as np
 import threading
 import queue
 import cv2
 from typing import Any
 from lerobot.common.datasets.lerobot_dataset import LeRobotDataset

 class DoraLeRobotRecorder:
    """Recorder class for LeRobot dataset."""

    def __init__(self):
        """Initialize the recorder state, create the dataset and start the frame timer.

        Episode count, episode/reset durations and frame rate are read from the
        ``TOTAL_EPISODES``, ``EPISODE_DURATION_S``, ``RESET_DURATION_S`` and
        ``FPS`` environment variables. Camera settings come from
        ``_get_cameras``.

        Raises:
            ValueError: Propagated from ``_setup_dataset`` when ``ROBOT_JOINTS``
                or ``REPO_ID`` is not set.
        """
        # Status messages are queued here and drained by get_pending_messages()
        self.message_queue = queue.Queue()

        self.dataset = None
        self.episode_active = False
        self.frame_count = 0

        # Latest value received per input id; guarded by buffer_lock because
        # handle_input() and the frame timer thread both touch it
        self.data_buffer = {}
        self.buffer_lock = threading.Lock()

        self.episode_index = 0
        self.start_time = None
        self.cameras = self._get_cameras()
        self.total_episodes = int(os.getenv("TOTAL_EPISODES", "10")) # Default to 10 episodes
        self.episode_duration = int(os.getenv("EPISODE_DURATION_S", "60")) # Default to 60 seconds
        self.reset_duration = int(os.getenv("RESET_DURATION_S", "15")) # Default to 15 seconds
        self.fps = int(os.getenv("FPS", "30")) # Default to 30 FPS

        # Episode state machine flags used by _check_episode_timing()
        self.recording_started = False
        self.in_reset_phase = False
        self.last_episode = False
        self.reset_start_time = None

        # Minimum spacing in seconds between two recorded frames
        self.frame_interval = 1.0 / self.fps
        self.last_frame_time = None
        self.shutdown = False

        # The dataset must exist before the timer thread starts adding frames
        self._setup_dataset()
        self._start_frame_timer()

    def _get_cameras(self) -> dict:
        """Get Camera config."""
        camera_names_str = os.getenv("CAMERA_NAMES")
        if camera_names_str:
            camera_names = [name.strip() for name in camera_names_str.split(',')]
        else:
            return {}

        cameras = {}
        for camera_name in camera_names:
            resolution = os.getenv(f"CAMERA_{camera_name.upper()}_RESOLUTION")
            if resolution:
                dims = [int(d.strip()) for d in resolution.split(',')]
                cameras[camera_name] = dims
            else:
                print(f"Warning: Set CAMERA_{camera_name.upper()}_RESOLUTION: \"height,width,channels\"")

        return cameras

    def _get_robot_joints(self) -> list:
        """Get robot joints."""
        joints_str = os.getenv("ROBOT_JOINTS")
        if joints_str:
            return [joint.strip() for joint in joints_str.split(',')]
        else:
            raise ValueError("ROBOT_JOINTS are not set.")

    def _get_tags(self) -> list:
        """Get tags for dataset."""
        tags_str = os.getenv("TAGS")
        if tags_str:
            return [tag.strip() for tag in tags_str.split(',')]
        return []

    def _setup_dataset(self):
        """Set up the LeRobot Dataset."""
        features = {}

        joint_names = self._get_robot_joints()
        features["action"] = {
            "dtype": "float32", 
            "shape": (len(joint_names),),
            "names": joint_names}
        features["observation.state"] = {
            "dtype": "float32",
            "shape": (len(joint_names),),
            "names": joint_names}

        self.use_videos = os.getenv("USE_VIDEOS", "true").lower() == "true"
        for camera_name in self.cameras:
            features[f"observation.images.{camera_name}"] = {
                "dtype": "video" if self.use_videos else "image",
                "shape": self.cameras[camera_name],
                "names": ["height", "width", "channels"]}

        self.required_features = set(features.keys())

        features.update({
            "timestamp": {"dtype": "float32", "shape": [1]},
            "frame_index": {"dtype": "int64", "shape": [1]},
            "episode_index": {"dtype": "int64", "shape": [1]},
            "index": {"dtype": "int64", "shape": [1]},
            "task_index": {"dtype": "int64", "shape": [1]},
        })

        repo_id = os.getenv("REPO_ID", None)
        if repo_id is None:
            raise ValueError("REPO_ID environment variable must be set to create dataset")

        self.dataset = LeRobotDataset.create(
            repo_id=repo_id,
            fps=self.fps,
            features=features,
            root=os.getenv("ROOT_PATH", None),
            robot_type=os.getenv("ROBOT_TYPE", "your_robot_type"),
            use_videos=self.use_videos,
            image_writer_processes=int(os.getenv("IMAGE_WRITER_PROCESSES", "0")),
            image_writer_threads=int(os.getenv("IMAGE_WRITER_THREADS", "4")) * len(self.cameras),
        )

    def _check_episode_timing(self):
        """Check if we need to start/end Episodes."""
        current_time = time.time()

        if not self.recording_started:  # Start the first episode
            self._start_episode()
            self.recording_started = True
            return False

        # If in reset phase, check if reset time is over
        if self.in_reset_phase or self.last_episode:
            if current_time - self.reset_start_time >= self.reset_duration:
                self.in_reset_phase = False
                if self.episode_index < self.total_episodes:
                    self._start_episode()
                else:
                    self._output(f"All {self.total_episodes} episodes completed!")
                    return True
            return False

        # If episode is active, check if episode time is over
        if self.episode_active:
            if (current_time - self.start_time) >= self.episode_duration:
                self._end_episode()
                if self.episode_index < self.total_episodes:
                    self._start_reset_phase()
                else:
                    self.last_episode = True

        return False

    def _start_episode(self):
        """Start a new episode."""
        self.episode_active = True
        self.start_time = time.time()
        self.frame_count = 0
        self._output(f"Started episode {self.episode_index + 1}/{self.total_episodes}")

    def _end_episode(self):
        """End current episode and save to dataset."""
        self.episode_active = False
        if self.frame_count > 0:
            self._output(f"Saving episode index {self.episode_index} with {self.frame_count} frames")
            self.dataset.save_episode()
            self.episode_index += 1
        else:
            self._output(f"Episode {self.episode_index} had no frames, skipping save")

    def _start_reset_phase(self):
        """Start the reset phase between episodes."""
        self.in_reset_phase = True
        self.reset_start_time = time.time()
        self._output(f"Reset phase started - {self.reset_duration}s break before next episode...")

    def _start_frame_timer(self):
        """Start the frame timer thread."""
        self.stop_timer = False
        self.frame_timer_thread = threading.Thread(target=self._frame_timer_loop, daemon=True)
        self.frame_timer_thread.start()

    def _frame_timer_loop(self):
        """Record frames at the configured rate and drive episode timing.

        This is the target of the thread created in ``_start_frame_timer``.
        It loops until ``stop_timer`` or ``shutdown`` is set, or until
        ``_check_episode_timing`` reports that recording is complete.
        """
        while not self.stop_timer and not self.shutdown:
            current_time = time.time()

            # Add a frame only while an episode is running, and only when no
            # frame was added yet or at least one frame interval has elapsed
            if self.episode_active and not self.in_reset_phase and (
                self.last_frame_time is None or 
                current_time - self.last_frame_time >= self.frame_interval
            ):
                self._add_frame()
                self.last_frame_time = current_time

            # Start/end episodes and reset phases as their durations elapse
            should_stop = self._check_episode_timing()
            if should_stop:
                self.stop_timer = True  # Signal to stop the timer
                break

            # Short sleep between polls so the loop does not spin continuously
            time.sleep(0.001)

    def handle_input(self, input_id: str, data: Any, metadata: Any):
        """Handle incoming data - Store the latest data."""
        # Only store data if not in reset phase
        if not self.in_reset_phase:
            with self.buffer_lock:
                self.data_buffer[input_id] = {
                    "data": data,
                    "timestamp": time.time(),
                    "metadata": metadata
                }

        should_stop = self._check_episode_timing()
        if should_stop:
            self.shutdown = True

        return should_stop

    def _shutdown(self):
        """Shutdown the Recorder."""
        print("Shutting down recorder...")

        # Signal shutdown
        self.shutdown = True
        self.stop_timer = True

        if self.frame_timer_thread.is_alive():
            print("Waiting for frame timer thread to finish...")
            self.frame_timer_thread.join(timeout=5.0)
        else:
            print("Frame timer thread finished successfully")

        self.finalize_dataset()
        print("Recorder shutdown complete")

    def _convert_camera_data(self, dora_data, metadata) -> np.ndarray:
        """Convert camera data from 1D pyarrow array to numpy format."""
        height, width = metadata.get("height"), metadata.get("width")
        encoding = metadata.get("encoding")
        image = dora_data.to_numpy().reshape(height, width, 3)  

        if encoding == "bgr8":
            image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        elif encoding == "yuv420":
            image = cv2.cvtColor(image, cv2.COLOR_YUV2RGB_I420)

        return image.astype(np.uint8)

    def convert_robot_data(self, dora_data, convert_degrees=True) -> np.ndarray:
        """Convert robot joint data, LeRobot expects angles in degrees and float32."""
        joint_array = dora_data.to_numpy()
        if convert_degrees:
            joint_array = np.rad2deg(joint_array)
        return joint_array.astype(np.float32)

    def _add_frame(self):
        """Add a frame to the dataset."""
        with self.buffer_lock:
            frame_data = {}
            ideal_timestamp = self.frame_count / self.fps

            for key, value in self.data_buffer.items():
                if key == "robot_action":
                    frame_data["action"] = self.convert_robot_data(self.data_buffer["robot_action"]["data"])
                if key == "robot_state":
                    frame_data["observation.state"] = self.convert_robot_data(self.data_buffer["robot_state"]["data"])
                if {'height', 'width'} <= value.get('metadata', {}).keys():
                    camera_name = key
                    image = self._convert_camera_data(
                        self.data_buffer[camera_name]["data"],
                        self.data_buffer[camera_name]["metadata"]
                    )
                    frame_data[f"observation.images.{camera_name}"] = image

            missing_keys = self.required_features - set(frame_data.keys())  # Ensure all required features are present 
            if missing_keys:
                print(f"Missing required data in frame: {missing_keys}")
                return

            self.dataset.add_frame(
                frame=frame_data,
                task=os.getenv("SINGLE_TASK", "Your task"),
                timestamp=ideal_timestamp
            )
            self.frame_count += 1

    def finalize_dataset(self):
        """Finalize dataset and optionally push to hub."""
        if self.episode_active:
            self._end_episode()

        if self.use_videos:
            self._output("Encoding videos...")
            self.dataset.encode_videos()

        if os.getenv("PUSH_TO_HUB", "false").lower() == "true":
            self._output("Pushing dataset to hub...")
            self.dataset.push_to_hub(
                tags=self._get_tags(),
                private=os.getenv("PRIVATE", "false").lower() == "true"
            )

        self._output(f"Dataset recording completed. Total episodes: {self.episode_index}")

    def _output(self, message: str):
        """Output message."""
        # Put message in queue to send
        self.message_queue.put(message)

    def get_pending_messages(self):
        """Get all pending messages from the queue."""
        messages = []
        while not self.message_queue.empty():
            messages.append(self.message_queue.get_nowait())
        return messages

 def _send_pending_messages(node, recorder):
    """Forward every queued recorder status message on the ``text`` output."""
    for message in recorder.get_pending_messages():
        node.send_output(
            output_id="text",
            data=pa.array([message]),
            metadata={})


 def main():
    """Run the recorder node until all episodes are recorded or events stop.

    Each event first flushes the recorder's queued status messages to the
    ``text`` output. ``INPUT`` events are then handed to the recorder. When
    the loop ends the recorder is shut down, which finalizes the dataset.
    """
    node = Node()
    recorder = DoraLeRobotRecorder()

    print("Starting dataset recording")
    print(f"Total episodes: {recorder.total_episodes}")
    print(f"Episode duration: {recorder.episode_duration}s")
    print(f"Reset duration: {recorder.reset_duration}s")

    for event in node:
        _send_pending_messages(node, recorder)

        if event["type"] == "INPUT":
            should_stop = recorder.handle_input(event["id"], event["value"], event.get("metadata", {}))
            if should_stop:
                print("All episodes completed, stopping recording...")
                break

    # Messages queued during the last iteration (e.g. the completion notice)
    # would otherwise never be sent, since no further event triggers a flush.
    _send_pending_messages(node, recorder)

    recorder._shutdown()

    # Finalizing queues more status messages (encoding, push, summary).
    _send_pending_messages(node, recorder)

 if __name__ == "__main__":
    main()
--- a/node-hub/dora-dataset-record/pyproject.toml
+++ b/node-hub/dora-dataset-record/pyproject.toml
@@ -0,0 +1,31 @@
 [project]
 name = "dora-dataset-record"
 version = "0.1.0"
 authors = [{ name = "Shashwat Patil", email = "email@email.com" }]
 description = "dora-dataset-record"
 license = { text = "MIT" }
 readme = "README.md"
 requires-python = ">=3.8"

 dependencies = ["dora-rs >= 0.3.9","pyarrow","lerobot"]

 [dependency-groups]
 dev = ["pytest >=8.1.1", "ruff >=0.9.1"]

 [project.scripts]
 dora-dataset-record = "dora_dataset_record.main:main"

 [tool.ruff.lint]
 extend-select = [
  "D",   # pydocstyle
  "UP"
 ]
 ignore = [
  "D100",  # Missing docstring in public module
  "D103",  # Missing docstring in public function
  "D104",  # Missing docstring in public package
 ]

 [tool.uv.sources]
 lerobot = {git = "https://github.com/huggingface/lerobot.git" }

--- a/node-hub/dora-dataset-record/tests/test_dora_dataset_record.py
+++ b/node-hub/dora-dataset-record/tests/test_dora_dataset_record.py
@@ -0,0 +1,13 @@
 """Test module for dora_dataset_record package."""

 import pytest


 def test_import_main():
    """Import the entry point and call it outside of a Dora dataflow."""
    from dora_dataset_record.main import main as entry_point

    # No dataflow is running here, so the call is expected to fail with
    # the RuntimeError raised by Dora.
    with pytest.raises(RuntimeError):
        entry_point()