Enable CI for robot devices with mocked versions (#398)

Co-authored-by: Simon Alibert <75076266+aliberts@users.noreply.github.com>
2024-10-03 17:05:23 +02:00
parent 72f402d44b
commit 26f97cfd17
18 changed files with 1053 additions and 237 deletions
--- a/lerobot/common/robot_devices/cameras/opencv.py
+++ b/lerobot/common/robot_devices/cameras/opencv.py
@@ -13,7 +13,6 @@ from dataclasses import dataclass, replace
 from pathlib import Path
 from threading import Thread

-import cv2
 import numpy as np
 from PIL import Image

@@ -24,10 +23,6 @@ from lerobot.common.robot_devices.utils import (
 )
 from lerobot.common.utils.utils import capture_timestamp_utc

-# Use 1 thread to avoid blocking the main thread. Especially useful during data collection
-# when other threads are used to save the images.
-cv2.setNumThreads(1)
-
 # The maximum opencv device index depends on your operating system. For instance,
 # if you have 3 cameras, they should be associated to index 0, 1, and 2. This is the case
 # on MacOS. However, on Ubuntu, the indices are different like 6, 16, 23.
@@ -36,7 +31,7 @@ cv2.setNumThreads(1)
 MAX_OPENCV_INDEX = 60


-def find_camera_indices(raise_when_empty=False, max_index_search_range=MAX_OPENCV_INDEX):
+def find_camera_indices(raise_when_empty=False, max_index_search_range=MAX_OPENCV_INDEX, mock=False):
    if platform.system() == "Linux":
        # Linux uses camera ports
        print("Linux detected. Finding available camera indices through scanning '/dev/video*' ports")
@@ -51,9 +46,14 @@ def find_camera_indices(raise_when_empty=False, max_index_search_range=MAX_OPENC
        )
        possible_camera_ids = range(max_index_search_range)

+    if mock:
+        from tests.mock_cv2 import VideoCapture
+    else:
+        from cv2 import VideoCapture
+
    camera_ids = []
    for camera_idx in possible_camera_ids:
-        camera = cv2.VideoCapture(camera_idx)
+        camera = VideoCapture(camera_idx)
        is_open = camera.isOpened()
        camera.release()

@@ -78,19 +78,25 @@ def save_image(img_array, camera_index, frame_index, images_dir):


 def save_images_from_cameras(
-    images_dir: Path, camera_ids: list[int] | None = None, fps=None, width=None, height=None, record_time_s=2
+    images_dir: Path,
+    camera_ids: list[int] | None = None,
+    fps=None,
+    width=None,
+    height=None,
+    record_time_s=2,
+    mock=False,
 ):
    """
    Initializes all the cameras and saves images to the directory. Useful to visually identify the camera
    associated to a given camera index.
    """
    if camera_ids is None:
-        camera_ids = find_camera_indices()
+        camera_ids = find_camera_indices(mock=mock)

    print("Connecting cameras")
    cameras = []
    for cam_idx in camera_ids:
-        camera = OpenCVCamera(cam_idx, fps=fps, width=width, height=height)
+        camera = OpenCVCamera(cam_idx, fps=fps, width=width, height=height, mock=mock)
        camera.connect()
        print(
            f"OpenCVCamera({camera.camera_index}, fps={camera.fps}, width={camera.width}, "
@@ -156,6 +162,7 @@ class OpenCVCameraConfig:
    width: int | None = None
    height: int | None = None
    color_mode: str = "rgb"
+    mock: bool = False

    def __post_init__(self):
        if self.color_mode not in ["rgb", "bgr"]:
@@ -215,6 +222,7 @@ class OpenCVCamera:
        self.width = config.width
        self.height = config.height
        self.color_mode = config.color_mode
+        self.mock = config.mock

        self.camera = None
        self.is_connected = False
@@ -227,17 +235,33 @@ class OpenCVCamera:
        if self.is_connected:
            raise RobotDeviceAlreadyConnectedError(f"OpenCVCamera({self.camera_index}) is already connected.")

+        if self.mock:
+            from tests.mock_cv2 import (
+                CAP_PROP_FPS,
+                CAP_PROP_FRAME_HEIGHT,
+                CAP_PROP_FRAME_WIDTH,
+                VideoCapture,
+            )
+        else:
+            from cv2 import (
+                CAP_PROP_FPS,
+                CAP_PROP_FRAME_HEIGHT,
+                CAP_PROP_FRAME_WIDTH,
+                VideoCapture,
+                setNumThreads,
+            )
+
+            # Use 1 thread to avoid blocking the main thread. Especially useful during data collection
+            # when other threads are used to save the images.
+            setNumThreads(1)
+
+        camera_idx = f"/dev/video{self.camera_index}" if platform.system() == "Linux" else self.camera_index
        # First create a temporary camera trying to access `camera_index`,
        # and verify it is a valid camera by calling `isOpened`.
-
-        if platform.system() == "Linux":
-            # Linux uses ports for connecting to cameras
-            tmp_camera = cv2.VideoCapture(f"/dev/video{self.camera_index}")
-        else:
-            tmp_camera = cv2.VideoCapture(self.camera_index)
-
+        tmp_camera = VideoCapture(camera_idx)
        is_camera_open = tmp_camera.isOpened()
        # Release camera to make it accessible for `find_camera_indices`
+        tmp_camera.release()
        del tmp_camera

        # If the camera doesn't work, display the camera indices corresponding to
@@ -251,28 +275,27 @@ class OpenCVCamera:
                    "To find the camera index you should use, run `python lerobot/common/robot_devices/cameras/opencv.py`."
                )

-            raise OSError(f"Can't access OpenCVCamera({self.camera_index}).")
+            raise OSError(f"Can't access OpenCVCamera({camera_idx}).")

        # Secondly, create the camera that will be used downstream.
        # Note: For some unknown reason, calling `isOpened` blocks the camera which then
        # needs to be re-created.
-        if platform.system() == "Linux":
-            self.camera = cv2.VideoCapture(f"/dev/video{self.camera_index}")
-        else:
-            self.camera = cv2.VideoCapture(self.camera_index)
+        self.camera = VideoCapture(camera_idx)

        if self.fps is not None:
-            self.camera.set(cv2.CAP_PROP_FPS, self.fps)
+            self.camera.set(CAP_PROP_FPS, self.fps)
        if self.width is not None:
-            self.camera.set(cv2.CAP_PROP_FRAME_WIDTH, self.width)
+            self.camera.set(CAP_PROP_FRAME_WIDTH, self.width)
        if self.height is not None:
-            self.camera.set(cv2.CAP_PROP_FRAME_HEIGHT, self.height)
+            self.camera.set(CAP_PROP_FRAME_HEIGHT, self.height)

-        actual_fps = self.camera.get(cv2.CAP_PROP_FPS)
-        actual_width = self.camera.get(cv2.CAP_PROP_FRAME_WIDTH)
-        actual_height = self.camera.get(cv2.CAP_PROP_FRAME_HEIGHT)
+        actual_fps = self.camera.get(CAP_PROP_FPS)
+        actual_width = self.camera.get(CAP_PROP_FRAME_WIDTH)
+        actual_height = self.camera.get(CAP_PROP_FRAME_HEIGHT)

+        # Using `math.isclose` since actual fps can be a float (e.g. 29.9 instead of 30)
        if self.fps is not None and not math.isclose(self.fps, actual_fps, rel_tol=1e-3):
+            # Using `OSError` since it's a broad that encompasses issues related to device communication
            raise OSError(
                f"Can't set {self.fps=} for OpenCVCamera({self.camera_index}). Actual value is {actual_fps}."
            )
@@ -285,9 +308,9 @@ class OpenCVCamera:
                f"Can't set {self.height=} for OpenCVCamera({self.camera_index}). Actual value is {actual_height}."
            )

-        self.fps = actual_fps
-        self.width = actual_width
-        self.height = actual_height
+        self.fps = round(actual_fps)
+        self.width = round(actual_width)
+        self.height = round(actual_height)

        self.is_connected = True

@@ -306,6 +329,7 @@ class OpenCVCamera:
        start_time = time.perf_counter()

        ret, color_image = self.camera.read()
+
        if not ret:
            raise OSError(f"Can't capture color image from camera {self.camera_index}.")

@@ -320,7 +344,12 @@ class OpenCVCamera:
        # However, Deep Learning framework such as LeRobot uses RGB format as default to train neural networks,
        # so we convert the image color from BGR to RGB.
        if requested_color_mode == "rgb":
-            color_image = cv2.cvtColor(color_image, cv2.COLOR_BGR2RGB)
+            if self.mock:
+                from tests.mock_cv2 import COLOR_BGR2RGB, cvtColor
+            else:
+                from cv2 import COLOR_BGR2RGB, cvtColor
+
+            color_image = cvtColor(color_image, COLOR_BGR2RGB)

        h, w, _ = color_image.shape
        if h != self.height or w != self.width:
@@ -334,11 +363,16 @@ class OpenCVCamera:
        # log the utc time at which the image was received
        self.logs["timestamp_utc"] = capture_timestamp_utc()

+        self.color_image = color_image
+
        return color_image

    def read_loop(self):
-        while self.stop_event is None or not self.stop_event.is_set():
-            self.color_image = self.read()
+        while not self.stop_event.is_set():
+            try:
+                self.color_image = self.read()
+            except Exception as e:
+                print(f"Error reading in thread: {e}")

    def async_read(self):
        if not self.is_connected:
@@ -353,15 +387,14 @@ class OpenCVCamera:
            self.thread.start()

        num_tries = 0
-        while self.color_image is None:
-            num_tries += 1
-            time.sleep(1 / self.fps)
-            if num_tries > self.fps and (self.thread.ident is None or not self.thread.is_alive()):
-                raise Exception(
-                    "The thread responsible for `self.async_read()` took too much time to start. There might be an issue. Verify that `self.thread.start()` has been called."
-                )
+        while True:
+            if self.color_image is not None:
+                return self.color_image

-        return self.color_image
+            time.sleep(1 / self.fps)
+            num_tries += 1
+            if num_tries > self.fps * 2:
+                raise TimeoutError("Timed out waiting for async_read() to start.")

    def disconnect(self):
        if not self.is_connected:
@@ -369,16 +402,14 @@ class OpenCVCamera:
                f"OpenCVCamera({self.camera_index}) is not connected. Try running `camera.connect()` first."
            )

-        if self.thread is not None and self.thread.is_alive():
-            # wait for the thread to finish
+        if self.thread is not None:
            self.stop_event.set()
-            self.thread.join()
+            self.thread.join()  # wait for the thread to finish
            self.thread = None
            self.stop_event = None

        self.camera.release()
        self.camera = None
-
        self.is_connected = False

    def __del__(self):