feat: Add video playback functionality and inference support
- Introduced VideoPlayer class to handle local video playback, emitting frames via frame_ready signal. - Updated MainWindow to switch between camera and video sources, integrating video playback controls. - Enhanced AppMenuBar with options to open video files and manage inference models. - Implemented BboxOverlay for displaying detection results on video frames. - Added InferenceManager to manage YOLO inference in a separate process, with error handling and restart logic. - Created tests for BboxOverlay and InferenceManager to ensure functionality and robustness. - Updated pyproject.toml to include optional dependencies for inference support.
This commit is contained in:
0
app/inference/__init__.py
Normal file
0
app/inference/__init__.py
Normal file
154
app/inference/bbox_overlay.py
Normal file
154
app/inference/bbox_overlay.py
Normal file
@@ -0,0 +1,154 @@
|
||||
"""BboxOverlay — draws YOLO detection bounding boxes on the camera view."""
|
||||
|
||||
from __future__ import annotations
|
||||
|
||||
import logging
|
||||
from typing import NamedTuple
|
||||
|
||||
from PySide6.QtCore import QRect, QSize, Qt, Slot
|
||||
from PySide6.QtGui import QColor, QFont, QPainter, QPen
|
||||
|
||||
from app.config import (
|
||||
BBOX_COLOR,
|
||||
BBOX_FONT_SIZE,
|
||||
BBOX_LABEL_BG_COLOR,
|
||||
BBOX_LABEL_TEXT_COLOR,
|
||||
BBOX_LINE_WIDTH,
|
||||
)
|
||||
from app.overlay.overlay_layer import IOverlayLayer
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
class Detection(NamedTuple):
|
||||
"""
|
||||
A single object detection result.
|
||||
|
||||
Coordinates (x1, y1, x2, y2) are in pixels of the *source frame*
|
||||
(i.e. the frame that was submitted to inference). BboxOverlay maps
|
||||
them to the letterboxed video_rect before drawing.
|
||||
"""
|
||||
|
||||
x1: float
|
||||
y1: float
|
||||
x2: float
|
||||
y2: float
|
||||
conf: float
|
||||
label: str
|
||||
|
||||
|
||||
class BboxOverlay(IOverlayLayer):
|
||||
"""
|
||||
Overlay layer that renders detection bounding boxes.
|
||||
|
||||
Usage:
|
||||
overlay = BboxOverlay()
|
||||
camera_view.add_overlay_layer(overlay)
|
||||
inference_manager.detections_ready.connect(overlay.on_detections)
|
||||
|
||||
Thread safety:
|
||||
on_detections() is called from the GUI thread (via Qt signal).
|
||||
paint() is also called from the GUI thread (paintEvent).
|
||||
No locks required.
|
||||
"""
|
||||
|
||||
def __init__(self) -> None:
|
||||
super().__init__()
|
||||
self._detections: list[Detection] = []
|
||||
self._source_size: QSize = QSize(0, 0)
|
||||
|
||||
self._pen = QPen(QColor(*BBOX_COLOR))
|
||||
self._pen.setWidth(BBOX_LINE_WIDTH)
|
||||
self._pen.setJoinStyle(Qt.PenJoinStyle.MiterJoin)
|
||||
|
||||
self._font = QFont("Monospace")
|
||||
self._font.setStyleHint(QFont.StyleHint.TypeWriter)
|
||||
self._font.setPointSize(BBOX_FONT_SIZE)
|
||||
self._font.setBold(True)
|
||||
|
||||
self._box_color = QColor(*BBOX_COLOR)
|
||||
self._bg_color = QColor(*BBOX_LABEL_BG_COLOR)
|
||||
self._text_color = QColor(*BBOX_LABEL_TEXT_COLOR)
|
||||
|
||||
# ------------------------------------------------------------------
|
||||
# Public API
|
||||
# ------------------------------------------------------------------
|
||||
|
||||
@Slot(object, object)
|
||||
def on_detections(
|
||||
self,
|
||||
detections: list[Detection],
|
||||
source_size: tuple[int, int],
|
||||
) -> None:
|
||||
"""
|
||||
Receive detection results from InferenceManager.
|
||||
|
||||
Args:
|
||||
detections: List of Detection namedtuples (pixel coords).
|
||||
source_size: (width, height) of the frame that was inferred.
|
||||
"""
|
||||
self._detections = detections
|
||||
self._source_size = QSize(*source_size)
|
||||
|
||||
def clear(self) -> None:
|
||||
"""Remove all currently displayed detections."""
|
||||
self._detections = []
|
||||
|
||||
# ------------------------------------------------------------------
|
||||
# IOverlayLayer implementation
|
||||
# ------------------------------------------------------------------
|
||||
|
||||
def paint(self, painter: QPainter, video_rect: QRect) -> None:
|
||||
if not self._detections:
|
||||
return
|
||||
if self._source_size.isEmpty():
|
||||
return
|
||||
|
||||
src_w = self._source_size.width()
|
||||
src_h = self._source_size.height()
|
||||
vr = video_rect
|
||||
|
||||
# Scale factors: source-pixel → video_rect-pixel
|
||||
scale_x = vr.width() / src_w
|
||||
scale_y = vr.height() / src_h
|
||||
|
||||
painter.setFont(self._font)
|
||||
fm = painter.fontMetrics()
|
||||
|
||||
for det in self._detections:
|
||||
# Map to widget coordinates
|
||||
wx1 = vr.x() + int(det.x1 * scale_x)
|
||||
wy1 = vr.y() + int(det.y1 * scale_y)
|
||||
wx2 = vr.x() + int(det.x2 * scale_x)
|
||||
wy2 = vr.y() + int(det.y2 * scale_y)
|
||||
|
||||
box_rect = QRect(wx1, wy1, wx2 - wx1, wy2 - wy1)
|
||||
|
||||
# Draw bounding box
|
||||
painter.setPen(self._pen)
|
||||
painter.setBrush(Qt.BrushStyle.NoBrush)
|
||||
painter.drawRect(box_rect)
|
||||
|
||||
# Label text: "label 0.87"
|
||||
label_text = f"{det.label} {det.conf:.2f}"
|
||||
text_w = fm.horizontalAdvance(label_text) + 6
|
||||
text_h = fm.height() + 2
|
||||
|
||||
# Position label above box, clamped to video_rect
|
||||
lx = wx1
|
||||
ly = wy1 - text_h
|
||||
if ly < vr.top():
|
||||
ly = wy1 # draw inside box if no room above
|
||||
|
||||
label_bg = QRect(lx, ly, text_w, text_h)
|
||||
|
||||
painter.setPen(Qt.PenStyle.NoPen)
|
||||
painter.setBrush(self._bg_color)
|
||||
painter.drawRect(label_bg)
|
||||
|
||||
painter.setPen(QPen(self._text_color))
|
||||
painter.drawText(
|
||||
lx + 3,
|
||||
ly + fm.ascent() + 1,
|
||||
label_text,
|
||||
)
|
||||
196
app/inference/worker.py
Normal file
196
app/inference/worker.py
Normal file
@@ -0,0 +1,196 @@
|
||||
"""YOLO inference worker — runs in a separate process.
|
||||
|
||||
This module contains only plain functions (no Qt, no PySide6) so it can
|
||||
safely be imported and executed in a child process via multiprocessing.
|
||||
|
||||
IPC protocol
|
||||
------------
|
||||
input_queue receives : FramePacket (frame_id, raw_bytes, width, height, channels)
|
||||
output_queue sends : ResultPacket (frame_id, detections, width, height)
|
||||
stop_event : multiprocessing.Event — set by parent to request clean exit
|
||||
|
||||
Detection format (namedtuple-compatible plain tuple):
|
||||
(x1, y1, x2, y2, conf, label) — all floats/str, x/y in source-frame pixels
|
||||
"""
|
||||
|
||||
from __future__ import annotations
|
||||
|
||||
import logging
|
||||
import platform
|
||||
import sys
|
||||
from multiprocessing import Event, Queue
|
||||
from queue import Empty
|
||||
from typing import NamedTuple
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Data structures shared between worker and manager
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
class FramePacket(NamedTuple):
|
||||
frame_id: int
|
||||
raw_bytes: bytes # RGB bytes, row-major, shape = (height, width, channels)
|
||||
width: int
|
||||
height: int
|
||||
channels: int # always 3 (RGB)
|
||||
|
||||
|
||||
class ResultPacket(NamedTuple):
|
||||
frame_id: int
|
||||
detections: list # list of (x1, y1, x2, y2, conf, label) tuples
|
||||
width: int # source frame width (for overlay scaling)
|
||||
height: int # source frame height
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Worker entry point
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
def run_worker(
|
||||
model_path: str,
|
||||
input_queue: Queue,
|
||||
output_queue: Queue,
|
||||
stop_event: Event,
|
||||
log_level: int = logging.WARNING,
|
||||
) -> None:
|
||||
"""
|
||||
Main loop of the inference worker process.
|
||||
|
||||
Loads the YOLO model once, then processes frames from input_queue
|
||||
until stop_event is set. Results are posted to output_queue.
|
||||
|
||||
This function is designed to be the target of multiprocessing.Process.
|
||||
It must NOT import PySide6 or any Qt module.
|
||||
"""
|
||||
_configure_worker_logging(log_level)
|
||||
logger.info("Inference worker starting (pid=%d)", _getpid())
|
||||
|
||||
try:
|
||||
model = _load_model(model_path)
|
||||
except Exception as exc:
|
||||
logger.error("Failed to load model '%s': %s", model_path, exc)
|
||||
# Signal failure by putting None — manager treats it as error
|
||||
output_queue.put(None)
|
||||
return
|
||||
|
||||
logger.info("Model loaded: %s", model_path)
|
||||
|
||||
while not stop_event.is_set():
|
||||
try:
|
||||
packet: FramePacket = input_queue.get(timeout=0.1)
|
||||
except Empty:
|
||||
continue
|
||||
except Exception as exc:
|
||||
logger.error("Error reading input queue: %s", exc)
|
||||
break
|
||||
|
||||
try:
|
||||
result = _infer(model, packet)
|
||||
output_queue.put(result)
|
||||
except Exception as exc:
|
||||
logger.error("Inference error (frame %d): %s", packet.frame_id, exc)
|
||||
# Put empty result so manager knows we're still alive
|
||||
output_queue.put(ResultPacket(
|
||||
frame_id=packet.frame_id,
|
||||
detections=[],
|
||||
width=packet.width,
|
||||
height=packet.height,
|
||||
))
|
||||
|
||||
logger.info("Inference worker stopping")
|
||||
|
||||
|
||||
# ---------------------------------------------------------------------------
|
||||
# Helpers
|
||||
# ---------------------------------------------------------------------------
|
||||
|
||||
def _load_model(model_path: str):
|
||||
"""Load YOLO model with best available device."""
|
||||
from ultralytics import YOLO # noqa: PLC0415
|
||||
|
||||
device = _select_device()
|
||||
logger.info("Loading YOLO model on device='%s'", device)
|
||||
model = YOLO(model_path)
|
||||
# Warm up — run on a tiny dummy to JIT-compile kernels
|
||||
try:
|
||||
import numpy as np # noqa: PLC0415
|
||||
dummy = np.zeros((64, 64, 3), dtype=np.uint8)
|
||||
model(dummy, device=device, verbose=False)
|
||||
except Exception as exc:
|
||||
logger.warning("Warm-up failed (non-fatal): %s", exc)
|
||||
return model
|
||||
|
||||
|
||||
def _select_device() -> str:
|
||||
"""
|
||||
Choose inference device.
|
||||
|
||||
Priority:
|
||||
- macOS → "mps" if available (Metal GPU), else "cpu"
|
||||
- others → "cpu"
|
||||
"""
|
||||
system = platform.system()
|
||||
if system == "Darwin":
|
||||
try:
|
||||
import torch # noqa: PLC0415
|
||||
if torch.backends.mps.is_available():
|
||||
logger.info("MPS (Metal) available — using GPU")
|
||||
return "mps"
|
||||
except Exception:
|
||||
pass
|
||||
logger.info("MPS not available — using CPU")
|
||||
return "cpu"
|
||||
|
||||
|
||||
def _infer(model, packet: FramePacket) -> ResultPacket:
|
||||
"""Run model on one frame, return ResultPacket."""
|
||||
import numpy as np # noqa: PLC0415
|
||||
|
||||
frame_np = np.frombuffer(packet.raw_bytes, dtype=np.uint8).reshape(
|
||||
(packet.height, packet.width, packet.channels)
|
||||
)
|
||||
|
||||
device = _select_device()
|
||||
results = model(frame_np, device=device, verbose=False)
|
||||
|
||||
detections = []
|
||||
for r in results:
|
||||
if r.boxes is None:
|
||||
continue
|
||||
boxes = r.boxes
|
||||
for i in range(len(boxes)):
|
||||
xyxy = boxes.xyxy[i].tolist() # [x1, y1, x2, y2] in source pixels
|
||||
conf = float(boxes.conf[i])
|
||||
cls_idx = int(boxes.cls[i])
|
||||
label = (
|
||||
r.names[cls_idx]
|
||||
if r.names and cls_idx in r.names
|
||||
else str(cls_idx)
|
||||
)
|
||||
detections.append((
|
||||
float(xyxy[0]), float(xyxy[1]),
|
||||
float(xyxy[2]), float(xyxy[3]),
|
||||
conf, label,
|
||||
))
|
||||
|
||||
return ResultPacket(
|
||||
frame_id=packet.frame_id,
|
||||
detections=detections,
|
||||
width=packet.width,
|
||||
height=packet.height,
|
||||
)
|
||||
|
||||
|
||||
def _configure_worker_logging(level: int) -> None:
|
||||
logging.basicConfig(
|
||||
level=level,
|
||||
format="[worker %(process)d] %(levelname)s %(name)s: %(message)s",
|
||||
stream=sys.stderr,
|
||||
)
|
||||
|
||||
|
||||
def _getpid() -> int:
|
||||
import os # noqa: PLC0415
|
||||
return os.getpid()
|
||||
350
app/inference/worker_manager.py
Normal file
350
app/inference/worker_manager.py
Normal file
@@ -0,0 +1,350 @@
|
||||
"""InferenceManager — orchestrates the YOLO worker process from the GUI thread.
|
||||
|
||||
Responsibilities:
|
||||
- Start / stop the worker process
|
||||
- Submit frames (with drop-if-busy logic)
|
||||
- Poll result queue via QTimer (never blocks the GUI thread)
|
||||
- Watch process health via QTimer (auto-restart on crash)
|
||||
- Emit Qt signals with results for BboxOverlay
|
||||
"""
|
||||
|
||||
from __future__ import annotations
|
||||
|
||||
import logging
|
||||
import multiprocessing
|
||||
import time
|
||||
from pathlib import Path
|
||||
|
||||
from PySide6.QtCore import QObject, QTimer, Signal, Slot
|
||||
from PySide6.QtMultimedia import QVideoFrame
|
||||
|
||||
from app.config import (
|
||||
INFERENCE_MAX_RESTARTS,
|
||||
INFERENCE_POLL_INTERVAL_MS,
|
||||
INFERENCE_WATCHDOG_INTERVAL_MS,
|
||||
INFERENCE_WORKER_TIMEOUT_S,
|
||||
)
|
||||
from app.inference.bbox_overlay import Detection
|
||||
from app.inference.worker import FramePacket, ResultPacket, run_worker
|
||||
|
||||
logger = logging.getLogger(__name__)
|
||||
|
||||
|
||||
class InferenceManager(QObject):
|
||||
"""
|
||||
Manages the YOLO worker subprocess.
|
||||
|
||||
Signals:
|
||||
detections_ready(detections, source_size)
|
||||
Emitted in the GUI thread when a result arrives.
|
||||
detections : list[Detection]
|
||||
source_size : tuple[int, int] — (width, height) of inferred frame
|
||||
|
||||
inference_started() — worker is up and model is loaded
|
||||
inference_stopped() — worker has exited cleanly
|
||||
inference_error(str) — fatal error (max restarts exceeded)
|
||||
|
||||
Usage:
|
||||
mgr = InferenceManager(parent=self)
|
||||
mgr.detections_ready.connect(bbox_overlay.on_detections)
|
||||
mgr.start("path/to/model.pt")
|
||||
# ...
|
||||
mgr.submit_frame(video_frame) # called by FrameDispatcher subscriber
|
||||
# ...
|
||||
mgr.stop()
|
||||
"""
|
||||
|
||||
detections_ready = Signal(object, object) # list[Detection], tuple[int,int]
|
||||
inference_started = Signal()
|
||||
inference_stopped = Signal()
|
||||
inference_error = Signal(str)
|
||||
|
||||
def __init__(self, parent: QObject | None = None) -> None:
|
||||
super().__init__(parent)
|
||||
|
||||
self._model_path: str | None = None
|
||||
self._process: multiprocessing.Process | None = None
|
||||
self._input_queue: multiprocessing.Queue | None = None
|
||||
self._output_queue: multiprocessing.Queue | None = None
|
||||
self._stop_event: multiprocessing.Event | None = None
|
||||
|
||||
# Drop-if-busy flag — True while worker is processing a frame
|
||||
self._busy: bool = False
|
||||
self._frame_id: int = 0
|
||||
|
||||
# Restart tracking
|
||||
self._restart_count: int = 0
|
||||
self._last_result_time: float = 0.0
|
||||
|
||||
# Paused flag — inference can be suspended without stopping the process
|
||||
self._paused: bool = False
|
||||
|
||||
# QTimers (GUI thread)
|
||||
self._poll_timer = QTimer(self)
|
||||
self._poll_timer.setInterval(INFERENCE_POLL_INTERVAL_MS)
|
||||
self._poll_timer.timeout.connect(self._poll_output)
|
||||
|
||||
self._watchdog_timer = QTimer(self)
|
||||
self._watchdog_timer.setInterval(INFERENCE_WATCHDOG_INTERVAL_MS)
|
||||
self._watchdog_timer.timeout.connect(self._watchdog_check)
|
||||
|
||||
# ------------------------------------------------------------------
|
||||
# Public API
|
||||
# ------------------------------------------------------------------
|
||||
|
||||
def start(self, model_path: str) -> None:
|
||||
"""Load model and start the worker process."""
|
||||
if not Path(model_path).exists():
|
||||
msg = f"Model file not found: {model_path}"
|
||||
logger.error(msg)
|
||||
self.inference_error.emit(msg)
|
||||
return
|
||||
|
||||
self._stop_worker()
|
||||
self._model_path = model_path
|
||||
self._restart_count = 0
|
||||
self._paused = False
|
||||
self._start_worker()
|
||||
|
||||
def stop(self) -> None:
|
||||
"""Stop the worker process and reset state."""
|
||||
self._stop_worker()
|
||||
self._model_path = None
|
||||
self._restart_count = 0
|
||||
self._paused = False
|
||||
|
||||
def pause(self) -> None:
|
||||
"""Suspend frame submission without stopping the process."""
|
||||
self._paused = True
|
||||
logger.debug("InferenceManager: paused")
|
||||
|
||||
def resume(self) -> None:
|
||||
"""Resume frame submission."""
|
||||
self._paused = False
|
||||
logger.debug("InferenceManager: resumed")
|
||||
|
||||
@property
|
||||
def is_running(self) -> bool:
|
||||
return self._process is not None and self._process.is_alive()
|
||||
|
||||
@property
|
||||
def is_paused(self) -> bool:
|
||||
return self._paused
|
||||
|
||||
@property
|
||||
def model_path(self) -> str | None:
|
||||
return self._model_path
|
||||
|
||||
@Slot(QVideoFrame)
|
||||
def submit_frame(self, frame: QVideoFrame) -> None:
|
||||
"""
|
||||
Attempt to submit a frame for inference.
|
||||
|
||||
Drops the frame silently if:
|
||||
- manager is not running
|
||||
- manager is paused
|
||||
- worker is still busy with previous frame (drop_if_busy)
|
||||
"""
|
||||
if not self.is_running or self._paused or self._busy:
|
||||
return
|
||||
|
||||
if not frame.isValid():
|
||||
return
|
||||
|
||||
# Map frame to read-only memory, copy raw bytes, unmap
|
||||
if not frame.map(QVideoFrame.MapMode.ReadOnly):
|
||||
logger.warning("InferenceManager: failed to map QVideoFrame")
|
||||
return
|
||||
|
||||
try:
|
||||
width = frame.width()
|
||||
height = frame.height()
|
||||
raw = bytes(frame.bits(0)) # plane 0 — copies data
|
||||
finally:
|
||||
frame.unmap()
|
||||
|
||||
if not raw:
|
||||
return
|
||||
|
||||
# Detect number of channels from byte count
|
||||
expected_rgb = width * height * 3
|
||||
expected_rgba = width * height * 4
|
||||
if len(raw) >= expected_rgba:
|
||||
# BGRA / RGBA — convert to RGB by stripping alpha and swapping B/R
|
||||
try:
|
||||
import numpy as np # noqa: PLC0415
|
||||
arr = np.frombuffer(raw, dtype=np.uint8).reshape((height, width, 4))
|
||||
# Qt delivers BGRA → swap to RGB
|
||||
rgb = arr[:, :, [2, 1, 0]].copy()
|
||||
raw = rgb.tobytes()
|
||||
channels = 3
|
||||
except Exception as exc:
|
||||
logger.warning("Frame colour conversion failed: %s", exc)
|
||||
return
|
||||
elif len(raw) >= expected_rgb:
|
||||
channels = 3
|
||||
else:
|
||||
logger.warning(
|
||||
"Unexpected frame size: %d bytes for %dx%d",
|
||||
len(raw), width, height,
|
||||
)
|
||||
return
|
||||
|
||||
self._frame_id += 1
|
||||
packet = FramePacket(
|
||||
frame_id=self._frame_id,
|
||||
raw_bytes=raw,
|
||||
width=width,
|
||||
height=height,
|
||||
channels=channels,
|
||||
)
|
||||
|
||||
try:
|
||||
self._input_queue.put_nowait(packet)
|
||||
self._busy = True
|
||||
logger.debug("InferenceManager: submitted frame %d", self._frame_id)
|
||||
except Exception as exc:
|
||||
logger.warning("InferenceManager: could not enqueue frame: %s", exc)
|
||||
|
||||
# ------------------------------------------------------------------
|
||||
# Private — worker lifecycle
|
||||
# ------------------------------------------------------------------
|
||||
|
||||
def _start_worker(self) -> None:
|
||||
ctx = multiprocessing.get_context("spawn")
|
||||
self._input_queue = ctx.Queue(maxsize=1)
|
||||
self._output_queue = ctx.Queue(maxsize=4)
|
||||
self._stop_event = ctx.Event()
|
||||
|
||||
self._process = ctx.Process(
|
||||
target=run_worker,
|
||||
args=(
|
||||
self._model_path,
|
||||
self._input_queue,
|
||||
self._output_queue,
|
||||
self._stop_event,
|
||||
logging.WARNING,
|
||||
),
|
||||
daemon=True,
|
||||
name="inference-worker",
|
||||
)
|
||||
self._process.start()
|
||||
self._busy = False
|
||||
self._last_result_time = time.monotonic()
|
||||
|
||||
self._poll_timer.start()
|
||||
self._watchdog_timer.start()
|
||||
logger.info(
|
||||
"Inference worker started (pid=%d, model=%s)",
|
||||
self._process.pid, self._model_path,
|
||||
)
|
||||
self.inference_started.emit()
|
||||
|
||||
def _stop_worker(self) -> None:
|
||||
self._poll_timer.stop()
|
||||
self._watchdog_timer.stop()
|
||||
|
||||
if self._stop_event is not None:
|
||||
self._stop_event.set()
|
||||
|
||||
if self._process is not None:
|
||||
self._process.join(timeout=3.0)
|
||||
if self._process.is_alive():
|
||||
logger.warning("Worker did not stop cleanly — terminating")
|
||||
self._process.terminate()
|
||||
self._process.join(timeout=2.0)
|
||||
self._process = None
|
||||
|
||||
self._input_queue = None
|
||||
self._output_queue = None
|
||||
self._stop_event = None
|
||||
self._busy = False
|
||||
|
||||
logger.info("Inference worker stopped")
|
||||
self.inference_stopped.emit()
|
||||
|
||||
# ------------------------------------------------------------------
|
||||
# Private — timers
|
||||
# ------------------------------------------------------------------
|
||||
|
||||
@Slot()
|
||||
def _poll_output(self) -> None:
|
||||
"""Drain the output queue (called every INFERENCE_POLL_INTERVAL_MS ms)."""
|
||||
if self._output_queue is None:
|
||||
return
|
||||
|
||||
try:
|
||||
while True:
|
||||
item = self._output_queue.get_nowait()
|
||||
if item is None:
|
||||
# Worker signalled a fatal load error
|
||||
logger.error("Worker reported model load failure")
|
||||
self._handle_crash("Model failed to load in worker process")
|
||||
return
|
||||
|
||||
packet: ResultPacket = item
|
||||
self._busy = False
|
||||
self._last_result_time = time.monotonic()
|
||||
|
||||
detections = [
|
||||
Detection(x1, y1, x2, y2, conf, label)
|
||||
for x1, y1, x2, y2, conf, label in packet.detections
|
||||
]
|
||||
source_size = (packet.width, packet.height)
|
||||
|
||||
logger.debug(
|
||||
"InferenceManager: frame %d → %d detections",
|
||||
packet.frame_id, len(detections),
|
||||
)
|
||||
self.detections_ready.emit(detections, source_size)
|
||||
|
||||
except Exception:
|
||||
# Empty queue — normal
|
||||
pass
|
||||
|
||||
@Slot()
|
||||
def _watchdog_check(self) -> None:
|
||||
"""Detect crashed or hung worker process."""
|
||||
if self._process is None:
|
||||
return
|
||||
|
||||
# Process died unexpectedly
|
||||
if not self._process.is_alive():
|
||||
exit_code = self._process.exitcode
|
||||
logger.error("Worker process died (exitcode=%s)", exit_code)
|
||||
self._handle_crash(f"Worker process exited with code {exit_code}")
|
||||
return
|
||||
|
||||
# Worker alive but hasn't responded for too long (hung during inference)
|
||||
if self._busy:
|
||||
elapsed = time.monotonic() - self._last_result_time
|
||||
if elapsed > INFERENCE_WORKER_TIMEOUT_S:
|
||||
logger.error(
|
||||
"Worker timeout: no response for %.1f s — restarting", elapsed
|
||||
)
|
||||
self._process.terminate()
|
||||
self._process.join(timeout=2.0)
|
||||
self._handle_crash("Worker timed out (hung during inference)")
|
||||
|
||||
def _handle_crash(self, reason: str) -> None:
|
||||
"""Decide whether to auto-restart or give up."""
|
||||
# Clean up process handles (already dead)
|
||||
self._poll_timer.stop()
|
||||
self._watchdog_timer.stop()
|
||||
self._process = None
|
||||
self._busy = False
|
||||
|
||||
if self._restart_count < INFERENCE_MAX_RESTARTS:
|
||||
self._restart_count += 1
|
||||
logger.warning(
|
||||
"Auto-restarting worker (attempt %d/%d): %s",
|
||||
self._restart_count, INFERENCE_MAX_RESTARTS, reason,
|
||||
)
|
||||
self._start_worker()
|
||||
else:
|
||||
msg = (
|
||||
f"Inference worker failed after {INFERENCE_MAX_RESTARTS} restarts. "
|
||||
f"Last error: {reason}"
|
||||
)
|
||||
logger.error(msg)
|
||||
self.inference_error.emit(msg)
|
||||
Reference in New Issue
Block a user