Optimize processing pipeline and fix multi-target crash

Performance optimizations across 5 phases:
- Saturation filter: float32 → int32 integer math (~2-3x faster)
- Frame interpolation: pre-allocated uint16 scratch buffers
- Color correction: single-pass cv2.LUT instead of 3 channel lookups
- DDP: numpy vectorized color reorder + pre-allocated RGBW buffer
- Calibration boundaries: vectorized with np.arange + np.maximum
- wled_client: vectorized pixel validation and HTTP pixel list
- _fit_to_device: cached linspace arrays (now per-instance)
- Diagnostic lists: bounded deque(maxlen=...) instead of unbounded list
- Health checks: adaptive intervals (10s streaming, 60s idle)
- Profile engine: poll interval 3s → 1s

Bug fixes:
- Fix deque slicing crash killing targets when multiple run in parallel
  (deque doesn't support [-1:] or [:5] slice syntax, unlike list)
- Fix numpy array boolean ambiguity in send_pixels() validation
- Persist fatal processing loop errors to metrics for API visibility
- Move _fit_to_device cache from class-level to instance-level to
  prevent cross-target cache thrashing

Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-02-26 21:28:17 +03:00
parent fda040ae18
commit 6f5bda6d8f
9 changed files with 135 additions and 92 deletions
--- a/server/src/wled_controller/core/devices/ddp_client.py
+++ b/server/src/wled_controller/core/devices/ddp_client.py
@@ -52,6 +52,9 @@ class DDPClient:
        self._protocol = None
        self._sequence = 0
        self._buses: List[BusConfig] = []
+        # Pre-allocated RGBW buffer (resized on demand)
+        self._rgbw_buf: Optional[np.ndarray] = None
+        self._rgbw_buf_n: int = 0

    async def connect(self):
        """Establish UDP connection."""
@@ -136,26 +139,23 @@ class DDPClient:

        return header + rgb_data

-    def _reorder_pixels(
-        self,
-        pixels: List[Tuple[int, int, int]],
-    ) -> List[Tuple[int, int, int]]:
-        """Apply per-bus color order reordering.
+    def _reorder_pixels_numpy(self, pixel_array: np.ndarray) -> np.ndarray:
+        """Apply per-bus color order reordering using numpy fancy indexing.

        WLED may not apply per-bus color order conversion for DDP data on
        all buses (observed in multi-bus setups). We reorder pixel channels
        here so the hardware receives the correct byte order directly.

        Args:
-            pixels: List of (R, G, B) tuples in standard RGB order
+            pixel_array: (N, 3) uint8 numpy array in RGB order

        Returns:
-            List of reordered tuples matching each bus's hardware color order
+            Reordered array (may be a view or copy depending on buses)
        """
        if not self._buses:
-            return pixels
+            return pixel_array

-        result = list(pixels)
+        result = pixel_array.copy()
        for bus in self._buses:
            order_map = COLOR_ORDER_MAP.get(bus.color_order)
            if not order_map or order_map == (0, 1, 2):
@@ -163,10 +163,7 @@ class DDPClient:

            start = bus.start
            end = min(bus.start + bus.length, len(result))
-            for i in range(start, end):
-                r, g, b = result[i]
-                rgb = (r, g, b)
-                result[i] = (rgb[order_map[0]], rgb[order_map[1]], rgb[order_map[2]])
+            result[start:end] = result[start:end][:, order_map]

        return result

@@ -197,8 +194,12 @@ class DDPClient:
            bpp = 4 if self.rgbw else 3  # bytes per pixel
            pixel_array = np.array(pixels, dtype=np.uint8)
            if self.rgbw:
-                white = np.zeros((pixel_array.shape[0], 1), dtype=np.uint8)
-                pixel_array = np.hstack((pixel_array, white))
+                n = pixel_array.shape[0]
+                if n != self._rgbw_buf_n:
+                    self._rgbw_buf = np.zeros((n, 4), dtype=np.uint8)
+                    self._rgbw_buf_n = n
+                self._rgbw_buf[:, :3] = pixel_array
+                pixel_array = self._rgbw_buf
            pixel_bytes = pixel_array.tobytes()

            total_bytes = len(pixel_bytes)
@@ -256,10 +257,14 @@ class DDPClient:
        if not self._transport:
            raise RuntimeError("DDP client not connected")

-        # Handle RGBW: insert zero white channel column
+        # Handle RGBW: copy RGB into pre-allocated (N, 4) buffer
        if self.rgbw:
-            white = np.zeros((pixel_array.shape[0], 1), dtype=np.uint8)
-            pixel_array = np.hstack((pixel_array, white))
+            n = pixel_array.shape[0]
+            if n != self._rgbw_buf_n:
+                self._rgbw_buf = np.zeros((n, 4), dtype=np.uint8)
+                self._rgbw_buf_n = n
+            self._rgbw_buf[:, :3] = pixel_array
+            pixel_array = self._rgbw_buf

        pixel_bytes = pixel_array.tobytes()

--- a/server/src/wled_controller/core/devices/wled_client.py
+++ b/server/src/wled_controller/core/devices/wled_client.py
@@ -333,18 +333,25 @@ class WLEDClient(LEDClient):
            RuntimeError: If request fails
        """
        # Validate inputs
-        if not pixels:
-            raise ValueError("Pixels list cannot be empty")
+        if isinstance(pixels, np.ndarray):
+            if pixels.size == 0:
+                raise ValueError("Pixels array cannot be empty")
+            pixel_arr = pixels
+        else:
+            if not pixels:
+                raise ValueError("Pixels list cannot be empty")
+            pixel_arr = np.array(pixels, dtype=np.int16)

        if not 0 <= brightness <= 255:
            raise ValueError(f"Brightness must be 0-255, got {brightness}")

-        # Validate pixel values
-        validated_pixels = []
-        for i, (r, g, b) in enumerate(pixels):
-            if not (0 <= r <= 255 and 0 <= g <= 255 and 0 <= b <= 255):
-                raise ValueError(f"Invalid RGB values at index {i}: ({r}, {g}, {b})")
-            validated_pixels.append((int(r), int(g), int(b)))
+        # Validate pixel values using vectorized bounds check
+        if pixel_arr.dtype != np.uint8:
+            if np.any((pixel_arr < 0) | (pixel_arr > 255)):
+                bad_mask = np.any((pixel_arr < 0) | (pixel_arr > 255), axis=1)
+                idx = int(np.argmax(bad_mask))
+                raise ValueError(f"Invalid RGB values at index {idx}: {tuple(pixel_arr[idx])}")
+        validated_pixels = pixel_arr.astype(np.uint8) if pixel_arr.dtype != np.uint8 else pixel_arr

        # Use DDP protocol if enabled
        if self.use_ddp and self._ddp_client:
@@ -354,33 +361,24 @@ class WLEDClient(LEDClient):

    async def _send_pixels_ddp(
        self,
-        pixels: List[Tuple[int, int, int]],
+        pixels: np.ndarray,
        brightness: int = 255,
    ) -> bool:
        """Send pixels via DDP protocol.

        Args:
-            pixels: List of (R, G, B) tuples
+            pixels: (N, 3) uint8 numpy array of RGB values
            brightness: Global brightness (0-255)

        Returns:
            True if successful
        """
        try:
-            # Apply brightness to pixels
            if brightness < 255:
-                brightness_factor = brightness / 255.0
-                pixels = [
-                    (
-                        int(r * brightness_factor),
-                        int(g * brightness_factor),
-                        int(b * brightness_factor)
-                    )
-                    for r, g, b in pixels
-                ]
+                pixels = (pixels.astype(np.uint16) * brightness >> 8).astype(np.uint8)

            logger.debug(f"Sending {len(pixels)} LEDs via DDP")
-            await self._ddp_client.send_pixels(pixels)
+            self._ddp_client.send_pixels_numpy(pixels)
            logger.debug(f"Successfully sent pixel colors via DDP")
            return True

@@ -390,14 +388,14 @@ class WLEDClient(LEDClient):

    async def _send_pixels_http(
        self,
-        pixels: List[Tuple[int, int, int]],
+        pixels: np.ndarray,
        brightness: int = 255,
        segment_id: int = 0,
    ) -> bool:
        """Send pixels via HTTP JSON API.

        Args:
-            pixels: List of (R, G, B) tuples
+            pixels: (N, 3) uint8 numpy array of RGB values
            brightness: Global brightness (0-255)
            segment_id: Segment ID to update

@@ -406,9 +404,8 @@ class WLEDClient(LEDClient):
        """
        try:
            # Build indexed pixel array: [led_index, r, g, b, ...]
-            indexed_pixels = []
-            for i, (r, g, b) in enumerate(pixels):
-                indexed_pixels.extend([i, int(r), int(g), int(b)])
+            indices = np.arange(len(pixels), dtype=np.int32).reshape(-1, 1)
+            indexed_pixels = np.hstack([indices, pixels.astype(np.int32)]).ravel().tolist()

            # Build WLED JSON state
            payload = {