Add robot_devices and control_robot script

2024-07-02 21:09:00 +02:00
parent e410e5d711
commit 858d49fc04
11 changed files with 1588 additions and 23 deletions
--- a/lerobot/common/robot_devices/cameras/opencv.py
+++ b/lerobot/common/robot_devices/cameras/opencv.py
@@ -0,0 +1,249 @@
+
+
+import argparse
+from dataclasses import dataclass, replace
+from pathlib import Path
+from threading import Thread
+import time
+import cv2
+import numpy as np
+
+from lerobot.common.robot_devices.cameras.utils import save_color_image
+
+
+def find_camera_indices(raise_when_empty=False, max_index_search_range=60):
+    camera_ids = []
+    for camera_idx in range(max_index_search_range):
+        camera = cv2.VideoCapture(camera_idx)
+        is_open = camera.isOpened()
+        camera.release()
+
+        if is_open:
+            print(f"Camera found at index {camera_idx}")
+            camera_ids.append(camera_idx)
+
+    if raise_when_empty and len(camera_ids) == 0:
+        raise OSError("Not a single camera was detected. Try re-plugging, or re-installing `opencv2`, or your camera driver, or make sure your camera is compatible with opencv2.")
+
+    return camera_ids
+
+def benchmark_cameras(cameras, out_dir=None, save_images=False, num_warmup_frames=4):
+    if out_dir:
+        out_dir = Path(out_dir)
+        out_dir.mkdir(parents=True, exist_ok=True)
+
+    for _ in range(num_warmup_frames):
+        for camera in cameras:
+            try:
+                camera.capture_image()
+                time.sleep(0.01)
+            except OSError as e:
+                print(e)
+
+    while True:
+        now = time.time()
+        for camera in cameras:
+            color_image = camera.capture_image("bgr" if save_images else "rgb")
+
+            if save_images:
+                image_path = out_dir / f"camera_{camera.camera_index:02}.png"
+                print(f"Write to {image_path}")
+                save_color_image(color_image, image_path, write_shape=True)
+
+        dt_s = (time.time() - now)
+        dt_ms = dt_s * 1000
+        freq = 1 / dt_s
+        print(f"Latency (ms): {dt_ms:.2f}\tFrequency: {freq:.2f}")
+
+        if save_images:
+            break
+        if cv2.waitKey(1) & 0xFF == ord("q"):
+            break
+
+
+@dataclass
+class OpenCVCameraConfig:
+    """
+    Example of tested options for Intel Real Sense D405:
+    
+    ```python
+    OpenCVCameraConfig(30, 640, 480)
+    OpenCVCameraConfig(60, 640, 480)
+    OpenCVCameraConfig(90, 640, 480)
+    OpenCVCameraConfig(30, 1280, 720)
+    ```
+    """
+    fps: int | None = None
+    width: int | None = None
+    height: int | None = None
+    color: str = "rgb"
+
+
+
+class OpenCVCamera():
+    # TODO(rcadene): improve dosctring
+    """
+    https://docs.opencv.org/4.x/d0/da7/videoio_overview.html
+    https://docs.opencv.org/4.x/d4/d15/group__videoio__flags__base.html#ga023786be1ee68a9105bf2e48c700294d
+
+    Example of uage:
+
+    ```python
+    camera = OpenCVCamera(2)
+    color_image = camera.capture_image()
+    ```
+    """
+    def __init__(self, camera_index: int, config: OpenCVCameraConfig | None = None, **kwargs):
+        if config is None:
+            config = OpenCVCameraConfig()
+        # Overwrite config arguments using kwargs
+        config = replace(config, **kwargs)
+
+        self.camera_index = camera_index
+        self.fps = config.fps
+        self.width = config.width
+        self.height = config.height
+        self.color = config.color
+
+        if self.color not in ["rgb", "bgr"]:
+            raise ValueError(f"Expected color values are 'rgb' or 'bgr', but {self.color} is provided.")
+
+        if self.camera_index is None:
+            raise ValueError(f"`camera_index` is expected to be one of these available cameras {OpenCVCamera.AVAILABLE_CAMERAS_INDICES}, but {camera_index} is provided instead.")
+        
+        self.camera = None
+        self.is_connected = False
+
+        self.t = Thread(target=self.capture_image_loop, args=())
+        self.t.daemon = True
+        self._color_image = None
+
+    def connect(self):
+        if self.is_connected:
+            raise ValueError(f"Camera {self.camera_index} is already connected.")
+
+        # First create a temporary camera trying to access `camera_index`,
+        # and verify it is a valid camera by calling `isOpened`.
+        tmp_camera = cv2.VideoCapture(self.camera_index)
+        is_camera_open = tmp_camera.isOpened()
+        # Release camera to make it accessible for `find_camera_indices`
+        del tmp_camera
+
+        # If the camera doesn't work, display the camera indices corresponding to
+        # valid cameras.
+        if not is_camera_open:
+            # Verify that the provided `camera_index` is valid before printing the traceback
+            if self.camera_index not in find_camera_indices():
+                raise ValueError(f"`camera_index` is expected to be one of these available cameras {OpenCVCamera.AVAILABLE_CAMERAS_INDICES}, but {self.camera_index} is provided instead.")
+
+            raise OSError(f"Can't access camera {self.camera_index}.")
+        
+        # Secondly, create the camera that will be used downstream.
+        # Note: For some unknown reason, calling `isOpened` blocks the camera which then
+        # needs to be re-created.
+        self.camera = cv2.VideoCapture(self.camera_index)
+
+        if self.fps:
+            self.camera.set(cv2.CAP_PROP_FPS, self.fps)
+        if self.width:
+            self.camera.set(cv2.CAP_PROP_FRAME_WIDTH, self.width)
+        if self.height:
+            self.camera.set(cv2.CAP_PROP_FRAME_HEIGHT, self.height)
+
+        actual_fps = self.camera.get(cv2.CAP_PROP_FPS)
+        actual_width = self.camera.get(cv2.CAP_PROP_FRAME_WIDTH)
+        actual_height = self.camera.get(cv2.CAP_PROP_FRAME_HEIGHT)
+
+        if self.fps and self.fps != actual_fps:
+            raise OSError(f"Can't set {self.fps=} for camera {self.camera_index}. Actual value is {actual_fps}.")
+        if self.width and self.width != actual_width:
+            raise OSError(f"Can't set {self.width=} for camera {self.camera_index}. Actual value is {actual_width}.")
+        if self.height and self.height != actual_height:
+            raise OSError(f"Can't set {self.height=} for camera {self.camera_index}. Actual value is {actual_height}.")
+        
+        self.is_connected = True
+        self.t.start()
+
+    def capture_image(self, temporary_color: str | None = None) -> np.ndarray:
+        if not self.is_connected:
+            self.connect()
+
+        ret, color_image = self.camera.read()
+        if not ret:
+            raise OSError(f"Can't capture color image from camera {self.camera_index}.")
+
+        if temporary_color is None:
+            requested_color = self.color
+        else:
+            requested_color = temporary_color
+        
+        if requested_color not in ["rgb", "bgr"]:
+            raise ValueError(f"Expected color values are 'rgb' or 'bgr', but {requested_color} is provided.")
+        
+        # OpenCV uses BGR format as default (blue, green red) for all operations, including displaying images.
+        # However, Deep Learning framework such as LeRobot uses RGB format as default to train neural networks,
+        # so we convert the image color from BGR to RGB.
+        if requested_color == "rgb":
+            color_image = cv2.cvtColor(color_image, cv2.COLOR_BGR2RGB)
+        
+        return color_image
+    
+    def capture_image_loop(self):
+        while True:
+            self._color_image = self.capture_image()
+
+    def read(self):
+        while self._color_image is None:
+            time.sleep(0.1)
+        return self._color_image
+
+    def disconnect(self):
+        if getattr(self, "camera", None):
+            self.camera.release()
+
+    def __del__(self):
+        self.disconnect()
+
+
+def save_images_config(config: OpenCVCameraConfig, out_dir: Path):
+    cameras = []
+    print(f"Available camera indices: {OpenCVCamera.AVAILABLE_CAMERAS_INDICES}")
+    for camera_idx in OpenCVCamera.AVAILABLE_CAMERAS_INDICES:
+        camera = OpenCVCamera(camera_idx, config)
+        cameras.append(camera)
+
+    out_dir = out_dir.parent / f"{out_dir.name}_{config.width}x{config.height}_{config.fps}"
+    benchmark_cameras(cameras, out_dir, save_images=True)
+
+def benchmark_config(config: OpenCVCameraConfig, camera_ids: list[int]):
+    cameras = [OpenCVCamera(idx, config) for idx in camera_ids]
+    benchmark_cameras(cameras)
+
+
+if __name__ == "__main__":
+    parser = argparse.ArgumentParser()
+    parser.add_argument("--mode", type=str, choices=["save_images", 'benchmark'], default="save_images")
+    parser.add_argument("--camera-ids", type=int, nargs="*", default=[16, 4, 22, 10])
+    parser.add_argument("--fps", type=int, default=30)
+    parser.add_argument("--width", type=str, default=640)
+    parser.add_argument("--height", type=str, default=480)
+    parser.add_argument("--out-dir", type=Path, default="outputs/benchmark_cameras/opencv/2024_06_22_1727")
+    args = parser.parse_args()
+
+    config = OpenCVCameraConfig(args.fps, args.width, args.height)
+    # config = OpenCVCameraConfig()
+    # config = OpenCVCameraConfig(60, 640, 480)
+    # config = OpenCVCameraConfig(90, 640, 480)
+    # config = OpenCVCameraConfig(30, 1280, 720)
+
+    if args.mode == "save_images":
+        save_images_config(config, args.out_dir)
+    elif args.mode == "benchmark":
+        benchmark_config(config, args.camera_ids)
+    else:
+        raise ValueError(args.mode)
+    
+    
+    
+
+