feat!: reorganize detection and tracking pipeline

Refactor the package into common, schema, detection, and tracking namespaces and move dataset-specific ActualTest utilities into tests/support.

Add a pluggable detection stack with typed protocols, pydantic-settings config, loguru-based runner logging, cvmmap and headless video sources, NATS and parquet sinks, and a structured coco-wholebody133 payload path.

Teach tracking replay loading to consume parquet detection directories directly, preserve empty frames, and keep the video-to-parquet-to-tracking workflow usable for offline E2E runs.

Vendor the local mmcv and xtcocotools wheels under Git LFS, update uv sources/lock state, and refresh the mmcv build so mmcv.ops loads successfully with the current torch+cu130 environment.
This commit is contained in:
2026-03-26 16:24:27 +08:00
parent f1a2372b3c
commit 2c0d51ab31
56 changed files with 5179 additions and 889 deletions
+223
View File
@@ -0,0 +1,223 @@
from collections.abc import AsyncIterator, Sequence
from pathlib import Path
import anyio
import numpy as np
import pytest
from pose_tracking_exp.detection.config import (
DetectionRunnerConfig,
load_detection_runner_config,
resolve_instances,
)
from pose_tracking_exp.detection.runner import (
PendingFrame,
SourceSlot,
run_detection_runner,
store_latest_frame,
take_pending_batch,
)
from pose_tracking_exp.schema.detection import PoseDetections, SourceFrame
def test_load_detection_runner_config_from_toml_and_env(
    monkeypatch: pytest.MonkeyPatch,
    tmp_path: Path,
) -> None:
    """Values come from the TOML file, and environment variables override it."""
    toml_lines = (
        'instances = ["front_left", "front_right"]',
        'device = "cuda:1"',
        'nats_host = "nats://localhost:4222"',
        'yolo_checkpoint = "checkpoint/yolo/yolo11_mix_epoch10.pt"',
        'pose_checkpoint = "checkpoint/dwpose/best_coco-wholebody_AP_epoch_50.pth"',
        "bbox_area_threshold = 2500",
        "max_batch_frames = 6",
        "max_batch_wait_ms = 3",
    )
    toml_file = tmp_path / "runner.toml"
    toml_file.write_text("\n".join(toml_lines), encoding="utf-8")
    # The env var should win over the file's `device = "cuda:1"` entry.
    monkeypatch.setenv("POSE_TRACKING_EXP_DETECTION_DEVICE", "cpu")
    loaded = load_detection_runner_config(toml_file)
    assert loaded.instances == ("front_left", "front_right")
    assert loaded.device == "cpu"
    assert loaded.nats_host == "nats://localhost:4222"
    assert loaded.bbox_area_threshold == 2500
    assert loaded.max_batch_frames == 6
    assert loaded.max_batch_wait_ms == 3
def test_resolve_instances_prefers_cli_values() -> None:
    """CLI-supplied instance names take precedence over config ones."""
    cli_values = ("cli_a", "cli_b")
    config_values = ("cfg_a",)
    assert resolve_instances(cli_values, config_values) == cli_values
def test_resolve_instances_falls_back_to_config_values() -> None:
    """With no CLI instances, the config-file values are used as-is."""
    config_values = ("cfg_a", "cfg_b")
    assert resolve_instances((), config_values) == config_values
def test_store_latest_frame_overwrites_pending_frame() -> None:
    """Storing a second frame replaces the pending one and counts the drop."""
    slot = SourceSlot(source_name="front_left")
    older = SourceFrame(
        source_name="front_left",
        image_bgr=np.zeros((1, 1, 3), dtype=np.uint8),
        frame_index=1,
        timestamp_unix_ns=100,
    )
    newer = SourceFrame(
        source_name="front_left",
        image_bgr=np.ones((1, 1, 3), dtype=np.uint8),
        frame_index=2,
        timestamp_unix_ns=200,
    )
    store_latest_frame(slot, older)
    store_latest_frame(slot, newer)
    # Both frames were received, but the first was dropped in favor of the second.
    assert slot.received_frames == 2
    assert slot.dropped_frames == 1
    assert slot.pending_frame is not None
    assert slot.pending_frame.frame is newer
def test_take_pending_batch_collects_at_most_one_frame_per_source() -> None:
    """The batch honors max_batch_frames and clears only the taken slots."""
    # (source_name, frame_index, timestamp_unix_ns) — insertion order matters:
    # the batch should take the first two sources and leave the third pending.
    specs = (
        ("front_left", 11, 110),
        ("front_right", 22, 220),
        ("rear", 33, 330),
    )
    slots: dict[str, SourceSlot] = {}
    for name, index, stamp in specs:
        frame = SourceFrame(
            source_name=name,
            image_bgr=np.zeros((1, 1, 3), dtype=np.uint8),
            frame_index=index,
            timestamp_unix_ns=stamp,
        )
        slots[name] = SourceSlot(
            source_name=name,
            pending_frame=PendingFrame(source_name=name, frame=frame),
        )
    batch = take_pending_batch(slots, max_batch_frames=2)
    assert [frame.source_name for frame in batch] == ["front_left", "front_right"]
    assert slots["front_left"].pending_frame is None
    assert slots["front_right"].pending_frame is None
    assert slots["rear"].pending_frame is not None
class StubSource:
    """Test double for a frame source: replays a fixed tuple of frames."""

    def __init__(self, source_name: str, frames: tuple[SourceFrame, ...]) -> None:
        self.source_name = source_name
        self._frames = frames

    async def frames(self) -> AsyncIterator[SourceFrame]:
        """Yield each canned frame once, in order."""
        for queued in self._frames:
            yield queued
class StubPoseShim:
    """Test double for the pose model: one synthetic detection per frame."""

    def process_many(self, frames: Sequence[SourceFrame]) -> list[PoseDetections]:
        """Return a fixed single-person detection echoing each frame's metadata."""
        return [
            PoseDetections(
                source_name=frame.source_name,
                frame_index=frame.frame_index,
                # (width, height) from the BGR array's (rows, cols) layout.
                source_size=(frame.image_bgr.shape[1], frame.image_bgr.shape[0]),
                boxes_xyxy=np.asarray([[0.0, 0.0, 10.0, 10.0]], dtype=np.float32),
                box_scores=np.asarray([1.0], dtype=np.float32),
                keypoints_xy=np.zeros((1, 133, 2), dtype=np.float32),
                keypoint_scores=np.ones((1, 133), dtype=np.float32),
                timestamp_unix_ns=frame.timestamp_unix_ns,
                keypoint_schema="coco_wholebody133",
            )
            for frame in frames
        ]
class StubSink:
    """Test double for a detection sink: records publishes and close calls."""

    def __init__(self) -> None:
        # Everything published, in order.
        self.messages: list[PoseDetections] = []
        # Flipped by aclose() so tests can assert shutdown happened.
        self.closed = False

    async def publish_pose(self, detections: PoseDetections) -> None:
        """Record the payload instead of sending it anywhere."""
        self.messages.append(detections)

    async def aclose(self) -> None:
        """Mark the sink as closed."""
        self.closed = True
def test_run_detection_runner_publishes_payloads() -> None:
    """End-to-end over stubs: every source frame is published, then the sink closes."""

    def single_frame_source(name: str, index: int, stamp: int) -> StubSource:
        # One-frame source so the runner drains quickly and exits.
        frame = SourceFrame(
            source_name=name,
            image_bgr=np.zeros((2, 3, 3), dtype=np.uint8),
            frame_index=index,
            timestamp_unix_ns=stamp,
        )
        return StubSource(name, (frame,))

    sink = StubSink()
    sources = (
        single_frame_source("cam0", 1, 100),
        single_frame_source("cam1", 2, 200),
    )
    # Checkpoint paths only need to exist; this test file itself suffices.
    config = DetectionRunnerConfig(
        instances=("cam0", "cam1"),
        pose_config_path=Path(__file__),
        yolo_checkpoint=Path(__file__),
        pose_checkpoint=Path(__file__),
        max_batch_frames=2,
    )
    anyio.run(
        run_detection_runner,
        sources,
        StubPoseShim(),
        sink,
        config,
    )
    assert sink.closed is True
    published = [
        (item.source_name, item.frame_index, item.timestamp_unix_ns)
        for item in sink.messages
    ]
    assert published == [("cam0", 1, 100), ("cam1", 2, 200)]