From 48409ed15045231010bea71a34a750bacf7dd3f6 Mon Sep 17 00:00:00 2001
From: Paul Nechifor <paul@nechifor.net>
Date: Tue, 20 Jan 2026 05:19:21 +0200
Subject: [PATCH 1/4] fix more tests

---
 .gitignore                                    |  1 +
 bin/pytest-fast                               |  6 ++
 bin/pytest-mujoco                             |  6 ++
 bin/pytest-slow                               |  2 +-
 dimos/e2e_tests/dimos_cli_call.py             |  6 +-
 dimos/e2e_tests/test_control_orchestrator.py  |  8 +-
 dimos/e2e_tests/test_person_follow.py         |  2 +-
 dimos/e2e_tests/test_spatial_memory.py        |  2 +-
 .../contact_graspnet_pytorch/inference.py     | 11 +--
 .../test_contact_graspnet.py                  |  1 +
 dimos/models/vl/test_vlm.py                   |  8 ++
 .../sensor_msgs/image_impls/AbstractImage.py  | 25 ++++++
 .../msgs/sensor_msgs/image_impls/CudaImage.py | 15 +++-
 .../image_impls/test_image_backends.py        |  2 +-
 .../test_wavefront_frontier_goal_selector.py  | 86 -------------------
 .../reid/test_embedding_id_system.py          | 80 +++++++++--------
 .../test_temporal_memory_module.py            |  2 +-
 .../perception/test_spatial_memory_module.py  |  1 +
 dimos/protocol/pubsub/test_spec.py            |  1 +
 .../robot/unitree_webrtc/mujoco_connection.py | 13 +++
 .../robot/unitree_webrtc/testing/test_mock.py | 62 -------------
 dimos/robot/unitree_webrtc/type/test_map.py   | 80 -----------------
 .../unitree_webrtc/unitree_go2_blueprints.py  |  8 +-
 pyproject.toml                                |  9 +-
 24 files changed, 138 insertions(+), 299 deletions(-)
 create mode 100755 bin/pytest-fast
 create mode 100755 bin/pytest-mujoco
 delete mode 100644 dimos/robot/unitree_webrtc/testing/test_mock.py
 delete mode 100644 dimos/robot/unitree_webrtc/type/test_map.py

diff --git a/.gitignore b/.gitignore
index 0e6781f3a8..e52d08ba32 100644
--- a/.gitignore
+++ b/.gitignore
@@ -63,3 +63,4 @@ yolo11n.pt
 /.mypy_cache*
 
 *mobileclip*
+/results
diff --git a/bin/pytest-fast b/bin/pytest-fast
new file mode 100755
index 0000000000..cb25f93288
--- /dev/null
+++ b/bin/pytest-fast
@@ -0,0 +1,6 @@
+#!/usr/bin/env bash
+
+set -euo pipefail
+
+. .venv/bin/activate
+exec pytest "$@" dimos
diff --git a/bin/pytest-mujoco b/bin/pytest-mujoco
new file mode 100755
index 0000000000..07e7ed90bc
--- /dev/null
+++ b/bin/pytest-mujoco
@@ -0,0 +1,6 @@
+#!/usr/bin/env bash
+
+set -euo pipefail
+
+. .venv/bin/activate
+exec pytest "$@" -m mujoco dimos
diff --git a/bin/pytest-slow b/bin/pytest-slow
index 702445ec85..85643d4413 100755
--- a/bin/pytest-slow
+++ b/bin/pytest-slow
@@ -3,4 +3,4 @@
 set -euo pipefail
 
 . .venv/bin/activate
-exec pytest "$@" -m 'not (tool or cuda or gpu or module or temporal)' dimos
+exec pytest "$@" -m 'not (tool or module or neverending or mujoco)' dimos
diff --git a/dimos/e2e_tests/dimos_cli_call.py b/dimos/e2e_tests/dimos_cli_call.py
index 956b30a086..2e987cf7ad 100644
--- a/dimos/e2e_tests/dimos_cli_call.py
+++ b/dimos/e2e_tests/dimos_cli_call.py
@@ -28,7 +28,11 @@ def start(self) -> None:
         if self.demo_args is None:
             raise ValueError("Demo args must be set before starting the process.")
 
-        self.process = subprocess.Popen(["dimos", "--simulation", *self.demo_args])
+        args = list(self.demo_args)
+        if len(args) == 1:
+            args = ["run", *args]
+
+        self.process = subprocess.Popen(["dimos", "--simulation", *args])
 
     def stop(self) -> None:
         if self.process is None:
diff --git a/dimos/e2e_tests/test_control_orchestrator.py b/dimos/e2e_tests/test_control_orchestrator.py
index 967a219ceb..aa820d66ec 100644
--- a/dimos/e2e_tests/test_control_orchestrator.py
+++ b/dimos/e2e_tests/test_control_orchestrator.py
@@ -125,7 +125,7 @@ def test_orchestrator_executes_trajectory(self, lcm_spy, start_blueprint) -> Non
 
             while time.time() - start_time < timeout:
                 status = client.get_trajectory_status("traj_arm")
-                if status is not None and status.get("state") == TrajectoryState.COMPLETED.name:
+                if status is not None and status.state == TrajectoryState.COMPLETED.name:
                     completed = True
                     break
                 time.sleep(0.1)
@@ -205,7 +205,7 @@ def test_orchestrator_cancel_trajectory(self, lcm_spy, start_blueprint) -> None:
             # Check status is ABORTED
             status = client.get_trajectory_status("traj_arm")
             assert status is not None
-            assert status.get("state") == TrajectoryState.ABORTED.name
+            assert status.state == TrajectoryState.ABORTED.name
         finally:
             client.stop_rpc_client()
 
@@ -258,7 +258,7 @@ def test_dual_arm_orchestrator(self, lcm_spy, start_blueprint) -> None:
             left_status = client.get_trajectory_status("traj_left")
             right_status = client.get_trajectory_status("traj_right")
 
-            assert left_status.get("state") == TrajectoryState.COMPLETED.name
-            assert right_status.get("state") == TrajectoryState.COMPLETED.name
+            assert left_status is not None and left_status.state == TrajectoryState.COMPLETED.name
+            assert right_status is not None and right_status.state == TrajectoryState.COMPLETED.name
         finally:
             client.stop_rpc_client()
diff --git a/dimos/e2e_tests/test_person_follow.py b/dimos/e2e_tests/test_person_follow.py
index 663dee420e..709f4e4511 100644
--- a/dimos/e2e_tests/test_person_follow.py
+++ b/dimos/e2e_tests/test_person_follow.py
@@ -55,7 +55,7 @@ def run_person_track() -> None:
 
 @pytest.mark.skipif(bool(os.getenv("CI")), reason="LCM spy doesn't work in CI.")
 @pytest.mark.skipif(not os.getenv("OPENAI_API_KEY"), reason="OPENAI_API_KEY not set.")
-@pytest.mark.e2e
+@pytest.mark.mujoco
 def test_person_follow(
     lcm_spy: LcmSpy,
     start_blueprint: Callable[[str], DimosCliCall],
diff --git a/dimos/e2e_tests/test_spatial_memory.py b/dimos/e2e_tests/test_spatial_memory.py
index 171f638f19..7c08800a6f 100644
--- a/dimos/e2e_tests/test_spatial_memory.py
+++ b/dimos/e2e_tests/test_spatial_memory.py
@@ -25,7 +25,7 @@
 
 @pytest.mark.skipif(bool(os.getenv("CI")), reason="LCM spy doesn't work in CI.")
 @pytest.mark.skipif(not os.getenv("OPENAI_API_KEY"), reason="OPENAI_API_KEY not set.")
-@pytest.mark.e2e
+@pytest.mark.mujoco
 def test_spatial_memory_navigation(
     lcm_spy: LcmSpy,
     start_blueprint: Callable[[str], DimosCliCall],
diff --git a/dimos/models/manipulation/contact_graspnet_pytorch/inference.py b/dimos/models/manipulation/contact_graspnet_pytorch/inference.py
index 0769fc150d..76bb377869 100644
--- a/dimos/models/manipulation/contact_graspnet_pytorch/inference.py
+++ b/dimos/models/manipulation/contact_graspnet_pytorch/inference.py
@@ -3,7 +3,6 @@
 import os
 
 from contact_graspnet_pytorch import config_utils  # type: ignore[import-not-found]
-from contact_graspnet_pytorch.checkpoints import CheckpointIO  # type: ignore[import-not-found]
 from contact_graspnet_pytorch.contact_grasp_estimator import (  # type: ignore[import-not-found]
     GraspEstimator,
 )
@@ -11,6 +10,7 @@
     load_available_input_data,
 )
 import numpy as np
+import torch
 
 from dimos.utils.data import get_data
 
@@ -45,12 +45,9 @@ def inference(global_config,  # type: ignore[no-untyped-def]
 
     # Load the weights
     model_checkpoint_dir = get_data(ckpt_dir)
-    checkpoint_io = CheckpointIO(checkpoint_dir=model_checkpoint_dir, model=grasp_estimator.model)
-    try:
-        checkpoint_io.load('model.pt')
-    except FileExistsError:
-        print('No model checkpoint found')
-
+    checkpoint_path = os.path.join(model_checkpoint_dir, 'model.pt')
+    state_dict = torch.load(checkpoint_path, weights_only=False)
+    grasp_estimator.model.load_state_dict(state_dict['model'])
 
     os.makedirs('results', exist_ok=True)
 
diff --git a/dimos/models/manipulation/contact_graspnet_pytorch/test_contact_graspnet.py b/dimos/models/manipulation/contact_graspnet_pytorch/test_contact_graspnet.py
index 7964a24954..7ee0f49451 100644
--- a/dimos/models/manipulation/contact_graspnet_pytorch/test_contact_graspnet.py
+++ b/dimos/models/manipulation/contact_graspnet_pytorch/test_contact_graspnet.py
@@ -13,6 +13,7 @@ def is_manipulation_installed() -> bool:
     except ImportError:
         return False
 
+@pytest.mark.integration
 @pytest.mark.skipif(not is_manipulation_installed(),
                    reason="This test requires 'pip install .[manipulation]' to be run")
 def test_contact_graspnet_inference() -> None:
diff --git a/dimos/models/vl/test_vlm.py b/dimos/models/vl/test_vlm.py
index 54e6c5111c..120dfb74fb 100644
--- a/dimos/models/vl/test_vlm.py
+++ b/dimos/models/vl/test_vlm.py
@@ -5,6 +5,7 @@
     ImageAnnotations,
 )
 import pytest
+import os
 
 from dimos.core import LCMTransport
 from dimos.models.vl.moondream import MoondreamVlModel
@@ -33,6 +34,9 @@
 )
 @pytest.mark.gpu
 def test_vlm_bbox_detections(model_class: "type[VlModel]", model_name: str) -> None:
+    if model_class is MoondreamHostedVlModel and 'MOONDREAM_API_KEY' not in os.environ:
+        pytest.skip("Need MOONDREAM_API_KEY to run")
+
     image = Image.from_file(get_data("cafe.jpg")).to_rgb()
 
     print(f"Testing {model_name}")
@@ -103,6 +107,10 @@ def test_vlm_bbox_detections(model_class: "type[VlModel]", model_name: str) -> N
 @pytest.mark.gpu
 def test_vlm_point_detections(model_class: "type[VlModel]", model_name: str) -> None:
     """Test VLM point detection capabilities."""
+
+    if model_class is MoondreamHostedVlModel and 'MOONDREAM_API_KEY' not in os.environ:
+        pytest.skip("Need MOONDREAM_API_KEY to run")
+
     image = Image.from_file(get_data("cafe.jpg")).to_rgb()
 
     print(f"Testing {model_name} point detection")
diff --git a/dimos/msgs/sensor_msgs/image_impls/AbstractImage.py b/dimos/msgs/sensor_msgs/image_impls/AbstractImage.py
index f5d92a3bc6..b71c5476fc 100644
--- a/dimos/msgs/sensor_msgs/image_impls/AbstractImage.py
+++ b/dimos/msgs/sensor_msgs/image_impls/AbstractImage.py
@@ -32,6 +32,31 @@
     cp = None
     HAS_CUDA = False
 
+# NVRTC defaults to C++11; libcu++ in recent CUDA requires at least C++17.
+if HAS_CUDA:
+    try:
+        import cupy.cuda.compiler as _cupy_compiler  # type: ignore[import-not-found]
+
+        if not getattr(_cupy_compiler, "_dimos_force_cxx17", False):
+            _orig_compile_using_nvrtc = _cupy_compiler.compile_using_nvrtc
+
+            def _compile_using_nvrtc(  # type: ignore[no-untyped-def]
+                source, options=(), *args, **kwargs
+            ):
+                filtered = tuple(
+                    opt
+                    for opt in options
+                    if opt not in ("-std=c++11", "--std=c++11", "-std=c++14", "--std=c++14")
+                )
+                if "--std=c++17" not in filtered and "-std=c++17" not in filtered:
+                    filtered = (*filtered, "--std=c++17")
+                return _orig_compile_using_nvrtc(source, filtered, *args, **kwargs)
+
+            _cupy_compiler.compile_using_nvrtc = _compile_using_nvrtc
+            _cupy_compiler._dimos_force_cxx17 = True
+    except Exception:
+        pass
+
 # Optional nvImageCodec (preferred GPU codec)
 USE_NVIMGCODEC = os.environ.get("USE_NVIMGCODEC", "0") == "1"
 NVIMGCODEC_LAST_USED = False
diff --git a/dimos/msgs/sensor_msgs/image_impls/CudaImage.py b/dimos/msgs/sensor_msgs/image_impls/CudaImage.py
index 8230daae29..cdfa1bf088 100644
--- a/dimos/msgs/sensor_msgs/image_impls/CudaImage.py
+++ b/dimos/msgs/sensor_msgs/image_impls/CudaImage.py
@@ -262,13 +262,20 @@
 } // extern "C"
 """
 
+_pnp_kernel = None
 if cp is not None:
-    _mod = cp.RawModule(code=_CUDA_SRC, options=("-std=c++14",), name_expressions=("pnp_gn_batch",))
-    _pnp_kernel = _mod.get_function("pnp_gn_batch")
+    try:
+        _mod = cp.RawModule(
+            code=_CUDA_SRC, options=("-std=c++17",), name_expressions=("pnp_gn_batch",)
+        )
+        _pnp_kernel = _mod.get_function("pnp_gn_batch")
+    except Exception:
+        # CUDA not available at runtime (e.g., no GPU or driver issues)
+        pass
 
 
 def _solve_pnp_cuda_kernel(obj, img, K, iterations: int = 15, damping: float = 1e-6):  # type: ignore[no-untyped-def]
-    if cp is None:
+    if cp is None or _pnp_kernel is None:
         raise RuntimeError("CuPy/CUDA not available")
 
     obj_cu = cp.asarray(obj, dtype=cp.float32)
@@ -709,7 +716,7 @@ def sharpness(self) -> float:
             magnitude = cp.hypot(gx, gy)
             mean_mag = float(cp.asnumpy(magnitude.mean()))
         except Exception:
-            return 0.0
+            raise
         if mean_mag <= 0:
             return 0.0
         return float(np.clip((np.log10(mean_mag + 1) - 1.7) / 2.0, 0.0, 1.0))
diff --git a/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py b/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py
index 0d3a3079dc..d3a5bf91e2 100644
--- a/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py
+++ b/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py
@@ -232,7 +232,7 @@ def test_sharpness(alloc_timer) -> None:
     if gpu is not None:
         s_gpu = gpu.sharpness
         # Values should be very close; minor border/rounding differences allowed
-        assert abs(s_cpu - s_gpu) < 0.6
+        assert abs(s_cpu - s_gpu) < 5e-2
 
 
 def test_to_opencv(alloc_timer) -> None:
diff --git a/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py b/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py
index aca154a6dd..20597dc87b 100644
--- a/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py
+++ b/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py
@@ -312,92 +312,6 @@ def test_exploration_with_no_gain_detection() -> None:
         explorer.stop()
 
 
-@pytest.mark.vis
-def test_frontier_detection_visualization() -> None:
-    """Test frontier detection with visualization (marked with @pytest.mark.vis)."""
-    # Get test costmap
-    costmap, first_lidar = create_test_costmap()
-
-    # Initialize frontier explorer with default parameters
-    explorer = WavefrontFrontierExplorer()
-
-    try:
-        # Use lidar origin as robot position
-        robot_pose = first_lidar.origin
-
-        # Detect all frontiers for visualization
-        all_frontiers = explorer.detect_frontiers(robot_pose, costmap)
-
-        # Get selected goal
-        selected_goal = explorer.get_exploration_goal(robot_pose, costmap)
-
-        print(f"Visualizing {len(all_frontiers)} frontier candidates")
-        if selected_goal:
-            print(f"Selected goal: ({selected_goal.x:.2f}, {selected_goal.y:.2f})")
-
-        # Create visualization
-        image_scale_factor = 4
-        base_image = costmap_to_pil_image(costmap, image_scale_factor)
-
-        # Helper function to convert world coordinates to image coordinates
-        def world_to_image_coords(world_pos: Vector3) -> tuple[int, int]:
-            grid_pos = costmap.world_to_grid(world_pos)
-            img_x = int(grid_pos.x * image_scale_factor)
-            img_y = int((costmap.height - grid_pos.y) * image_scale_factor)  # Flip Y
-            return img_x, img_y
-
-        # Draw visualization
-        draw = ImageDraw.Draw(base_image)
-
-        # Draw frontier candidates as gray dots
-        for frontier in all_frontiers[:20]:  # Limit to top 20
-            x, y = world_to_image_coords(frontier)
-            radius = 6
-            draw.ellipse(
-                [x - radius, y - radius, x + radius, y + radius],
-                fill=(128, 128, 128),  # Gray
-                outline=(64, 64, 64),
-                width=1,
-            )
-
-        # Draw robot position as blue dot
-        robot_x, robot_y = world_to_image_coords(robot_pose)
-        robot_radius = 10
-        draw.ellipse(
-            [
-                robot_x - robot_radius,
-                robot_y - robot_radius,
-                robot_x + robot_radius,
-                robot_y + robot_radius,
-            ],
-            fill=(0, 0, 255),  # Blue
-            outline=(0, 0, 128),
-            width=3,
-        )
-
-        # Draw selected goal as red dot
-        if selected_goal:
-            goal_x, goal_y = world_to_image_coords(selected_goal)
-            goal_radius = 12
-            draw.ellipse(
-                [
-                    goal_x - goal_radius,
-                    goal_y - goal_radius,
-                    goal_x + goal_radius,
-                    goal_y + goal_radius,
-                ],
-                fill=(255, 0, 0),  # Red
-                outline=(128, 0, 0),
-                width=3,
-            )
-
-        # Display the image
-        base_image.show(title="Frontier Detection - Office Lidar")
-        print("Visualization displayed. Close the image window to continue.")
-    finally:
-        explorer.stop()
-
-
 def test_performance_timing() -> None:
     """Test performance by timing frontier detection operations."""
     import time
diff --git a/dimos/perception/detection/reid/test_embedding_id_system.py b/dimos/perception/detection/reid/test_embedding_id_system.py
index 3a0899c848..b9e6f591ee 100644
--- a/dimos/perception/detection/reid/test_embedding_id_system.py
+++ b/dimos/perception/detection/reid/test_embedding_id_system.py
@@ -12,8 +12,8 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 
+import numpy as np
 import pytest
-import torch
 
 from dimos.msgs.sensor_msgs import Image
 from dimos.perception.detection.reid.embedding_id_system import EmbeddingIDSystem
@@ -25,8 +25,7 @@ def mobileclip_model():
     """Load MobileCLIP model once for all tests."""
     from dimos.models.embedding.mobileclip import MobileCLIPModel
 
-    model_path = get_data("models_mobileclip") / "mobileclip2_s0.pt"
-    model = MobileCLIPModel(model_name="MobileCLIP2-S0", model_path=model_path)
+    model = MobileCLIPModel()  # Uses default MobileCLIP2-S4
     model.start()
     return model
 
@@ -34,7 +33,11 @@ def mobileclip_model():
 @pytest.fixture
 def track_associator(mobileclip_model):
     """Create fresh EmbeddingIDSystem for each test."""
-    return EmbeddingIDSystem(model=lambda: mobileclip_model, similarity_threshold=0.75)
+    return EmbeddingIDSystem(
+        model=lambda: mobileclip_model,
+        similarity_threshold=0.75,
+        min_embeddings_for_matching=1,  # Allow matching with single embedding for tests
+    )
 
 
 @pytest.fixture(scope="session")
@@ -52,39 +55,40 @@ def test_update_embedding_single(track_associator, mobileclip_model, test_image)
     track_associator.update_embedding(track_id=1, new_embedding=embedding)
 
     assert 1 in track_associator.track_embeddings
-    assert track_associator.embedding_counts[1] == 1
+    assert len(track_associator.track_embeddings[1]) == 1
 
-    # Verify embedding is on device and normalized
-    emb_vec = track_associator.track_embeddings[1]
-    assert isinstance(emb_vec, torch.Tensor)
-    assert emb_vec.device.type in ["cuda", "cpu"]
-    norm = torch.norm(emb_vec).item()
+    # Verify embedding is stored as numpy array and normalized
+    emb_vec = track_associator.track_embeddings[1][0]
+    assert isinstance(emb_vec, np.ndarray)
+    norm = np.linalg.norm(emb_vec)
     assert abs(norm - 1.0) < 0.01, "Embedding should be normalized"
 
 
 @pytest.mark.gpu
-def test_update_embedding_running_average(track_associator, mobileclip_model, test_image) -> None:
-    """Test running average of embeddings."""
+def test_update_embedding_multiple(track_associator, mobileclip_model, test_image) -> None:
+    """Test storing multiple embeddings per track."""
     embedding1 = mobileclip_model.embed(test_image)
     embedding2 = mobileclip_model.embed(test_image)
 
     # Add first embedding
     track_associator.update_embedding(track_id=1, new_embedding=embedding1)
-    first_vec = track_associator.track_embeddings[1].clone()
+    first_vec = track_associator.track_embeddings[1][0].copy()
 
     # Add second embedding (same image, should be very similar)
     track_associator.update_embedding(track_id=1, new_embedding=embedding2)
-    avg_vec = track_associator.track_embeddings[1]
 
-    assert track_associator.embedding_counts[1] == 2
+    # Should have 2 embeddings now
+    assert len(track_associator.track_embeddings[1]) == 2
 
-    # Average should still be normalized
-    norm = torch.norm(avg_vec).item()
-    assert abs(norm - 1.0) < 0.01, "Average embedding should be normalized"
+    # Both should be normalized
+    for emb in track_associator.track_embeddings[1]:
+        norm = np.linalg.norm(emb)
+        assert abs(norm - 1.0) < 0.01, "Embedding should be normalized"
 
-    # Average should be similar to both originals (same image)
-    similarity1 = (first_vec @ avg_vec).item()
-    assert similarity1 > 0.99, "Average should be very similar to original"
+    # Second embedding should be similar to first (same image)
+    second_vec = track_associator.track_embeddings[1][1]
+    similarity = float(np.dot(first_vec, second_vec))
+    assert similarity > 0.99, "Same image should produce very similar embeddings"
 
 
 @pytest.mark.gpu
@@ -199,31 +203,33 @@ def test_associate_returns_cached(track_associator, mobileclip_model, test_image
 
 
 @pytest.mark.gpu
-def test_associate_not_ready(track_associator) -> None:
-    """Test that associate returns -1 for track without embedding."""
+def test_associate_no_embedding(track_associator) -> None:
+    """Test that associate creates new ID for track without embedding."""
+    # Track with no embedding gets assigned a new ID
     long_term_id = track_associator.associate(track_id=999)
-    assert long_term_id == -1, "Should return -1 for track without embedding"
+    assert long_term_id == 0, "Track without embedding should get new long_term_id"
+    assert track_associator.long_term_counter == 1
 
 
 @pytest.mark.gpu
-def test_gpu_performance(track_associator, mobileclip_model, test_image) -> None:
-    """Test that embeddings stay on GPU for performance."""
+def test_embeddings_stored_as_numpy(track_associator, mobileclip_model, test_image) -> None:
+    """Test that embeddings are stored as numpy arrays for efficient CPU comparisons."""
     embedding = mobileclip_model.embed(test_image)
     track_associator.update_embedding(track_id=1, new_embedding=embedding)
 
-    # Embedding should stay on device
-    emb_vec = track_associator.track_embeddings[1]
-    assert isinstance(emb_vec, torch.Tensor)
-    # Device comparison (handle "cuda" vs "cuda:0")
-    expected_device = mobileclip_model.device
-    assert emb_vec.device.type == torch.device(expected_device).type
+    # Embeddings should be stored as numpy arrays
+    emb_list = track_associator.track_embeddings[1]
+    assert isinstance(emb_list, list)
+    assert len(emb_list) == 1
+    assert isinstance(emb_list[0], np.ndarray)
 
-    # Running average should happen on GPU
+    # Add more embeddings
     embedding2 = mobileclip_model.embed(test_image)
     track_associator.update_embedding(track_id=1, new_embedding=embedding2)
 
-    avg_vec = track_associator.track_embeddings[1]
-    assert avg_vec.device.type == torch.device(expected_device).type
+    assert len(track_associator.track_embeddings[1]) == 2
+    for emb in track_associator.track_embeddings[1]:
+        assert isinstance(emb, np.ndarray)
 
 
 @pytest.mark.gpu
@@ -247,12 +253,12 @@ def test_multi_track_scenario(track_associator, mobileclip_model, test_image) ->
 
     # Frame 2: Track 1 and Track 2 appear (different objects)
     text_emb = mobileclip_model.embed_text("a dog")
-    track_associator.update_embedding(1, emb1)  # Update average
+    track_associator.update_embedding(1, emb1)  # Update embedding
     track_associator.update_embedding(2, text_emb)
     track_associator.add_negative_constraints([1, 2])  # Co-occur = different
     lt2 = track_associator.associate(2)
 
-    # Track 2 should get different ID despite any similarity
+    # Track 2 should get different ID due to negative constraint
     assert lt1 != lt2
 
     # Frame 3: Track 1 disappears, Track 3 appears (same as Track 1)
diff --git a/dimos/perception/experimental/temporal_memory/test_temporal_memory_module.py b/dimos/perception/experimental/temporal_memory/test_temporal_memory_module.py
index 8029bd6454..7b38e4ce40 100644
--- a/dimos/perception/experimental/temporal_memory/test_temporal_memory_module.py
+++ b/dimos/perception/experimental/temporal_memory/test_temporal_memory_module.py
@@ -81,7 +81,7 @@ def stop(self) -> None:
 
 @pytest.mark.skipif(bool(os.getenv("CI")), reason="LCM replay + dataset not CI-safe.")
 @pytest.mark.skipif(not os.getenv("OPENAI_API_KEY"), reason="OPENAI_API_KEY not set.")
-@pytest.mark.temporal  # TODO: This never finishes for me.
+@pytest.mark.neverending
 class TestTemporalMemoryModule:
     @pytest.fixture(scope="function")
     def temp_dir(self):
diff --git a/dimos/perception/test_spatial_memory_module.py b/dimos/perception/test_spatial_memory_module.py
index 48a2b2750f..47518b889b 100644
--- a/dimos/perception/test_spatial_memory_module.py
+++ b/dimos/perception/test_spatial_memory_module.py
@@ -110,6 +110,7 @@ def stop(self) -> None:
 
 
 @pytest.mark.gpu
+@pytest.mark.neverending
 class TestSpatialMemoryModule:
     @pytest.fixture(scope="function")
     def temp_dir(self):
diff --git a/dimos/protocol/pubsub/test_spec.py b/dimos/protocol/pubsub/test_spec.py
index a82728177e..357e1dfa1e 100644
--- a/dimos/protocol/pubsub/test_spec.py
+++ b/dimos/protocol/pubsub/test_spec.py
@@ -311,6 +311,7 @@ async def consume_messages() -> None:
         assert received_messages == messages_to_send
 
 
+@pytest.mark.integration
 @pytest.mark.parametrize("pubsub_context, topic, values", testdata)
 def test_high_volume_messages(
     pubsub_context: Callable[[], Any], topic: Any, values: list[Any]
diff --git a/dimos/robot/unitree_webrtc/mujoco_connection.py b/dimos/robot/unitree_webrtc/mujoco_connection.py
index 1ee00c1925..d4a7736fc2 100644
--- a/dimos/robot/unitree_webrtc/mujoco_connection.py
+++ b/dimos/robot/unitree_webrtc/mujoco_connection.py
@@ -15,6 +15,7 @@
 # limitations under the License.
 
 
+import atexit
 import base64
 from collections.abc import Callable
 import functools
@@ -25,6 +26,7 @@
 import threading
 import time
 from typing import Any, TypeVar
+import weakref
 
 import numpy as np
 from numpy.typing import NDArray
@@ -121,6 +123,7 @@ def start(self) -> None:
         try:
             # mjpython must be used macOS (because of launch_passive inside mujoco_process.py)
             executable = sys.executable if sys.platform != "darwin" else "mjpython"
+
             self.process = subprocess.Popen(
                 [executable, str(LAUNCHER_PATH), config_pickle, shm_names_json],
             )
@@ -140,6 +143,16 @@ def start(self) -> None:
                 raise RuntimeError(f"MuJoCo process failed to start (exit code {exit_code})")
             if self.shm_data.is_ready():
                 logger.info("MuJoCo process started successfully")
+                # Register atexit handler to ensure subprocess is cleaned up
+                # Use weakref to avoid preventing garbage collection
+                weak_self = weakref.ref(self)
+
+                def cleanup_on_exit() -> None:
+                    instance = weak_self()
+                    if instance is not None:
+                        instance.stop()
+
+                atexit.register(cleanup_on_exit)
                 return
             time.sleep(0.1)
 
diff --git a/dimos/robot/unitree_webrtc/testing/test_mock.py b/dimos/robot/unitree_webrtc/testing/test_mock.py
deleted file mode 100644
index fbdb614d63..0000000000
--- a/dimos/robot/unitree_webrtc/testing/test_mock.py
+++ /dev/null
@@ -1,62 +0,0 @@
-#!/usr/bin/env python3
-# Copyright 2025-2026 Dimensional Inc.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-import time
-
-import pytest
-
-from dimos.msgs.sensor_msgs import PointCloud2
-from dimos.robot.unitree_webrtc.testing.mock import Mock
-
-
-@pytest.mark.needsdata
-def test_mock_load_cast() -> None:
-    mock = Mock("test")
-
-    # Load a frame with type casting
-    frame = mock.load("a")
-
-    # Verify it's a PointCloud2 object
-    assert frame.__class__.__name__ == "PointCloud2"
-    assert hasattr(frame, "ts")
-    assert hasattr(frame, "pointcloud")
-
-    # Verify pointcloud has points
-    assert frame.pointcloud.has_points()
-    assert len(frame.pointcloud.points) > 0
-
-
-@pytest.mark.needsdata
-def test_mock_iterate() -> None:
-    """Test the iterate method of the Mock class."""
-    mock = Mock("office")
-
-    # Test iterate method
-    frames = list(mock.iterate())
-    assert len(frames) > 0
-    for frame in frames:
-        assert isinstance(frame, PointCloud2)
-        assert frame.pointcloud.has_points()
-
-
-@pytest.mark.needsdata
-def test_mock_stream() -> None:
-    frames = []
-    sub1 = Mock("office").stream(rate_hz=30.0).subscribe(on_next=frames.append)
-    time.sleep(0.1)
-    sub1.dispose()
-
-    assert len(frames) >= 2
-    assert isinstance(frames[0], PointCloud2)
diff --git a/dimos/robot/unitree_webrtc/type/test_map.py b/dimos/robot/unitree_webrtc/type/test_map.py
deleted file mode 100644
index 0c55db1e4e..0000000000
--- a/dimos/robot/unitree_webrtc/type/test_map.py
+++ /dev/null
@@ -1,80 +0,0 @@
-# Copyright 2025-2026 Dimensional Inc.
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-#     http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-
-import pytest
-
-from dimos.mapping.pointclouds.accumulators.general import _splice_cylinder
-from dimos.robot.unitree_webrtc.testing.helpers import show3d
-from dimos.robot.unitree_webrtc.testing.mock import Mock
-from dimos.robot.unitree_webrtc.type.lidar import pointcloud2_from_webrtc_lidar
-from dimos.robot.unitree_webrtc.type.map import Map
-from dimos.utils.testing import SensorReplay
-
-
-@pytest.mark.vis
-def test_costmap_vis() -> None:
-    map = Map()
-    map.start()
-    mock = Mock("office")
-    frames = list(mock.iterate())
-
-    for frame in frames:
-        print(frame)
-        map.add_frame(frame)
-
-    # Get global map and costmap
-    global_map = map.to_PointCloud2()
-    print(f"Global map has {len(global_map.pointcloud.points)} points")
-    show3d(global_map.pointcloud, title="Global Map").run()
-
-
-@pytest.mark.vis
-def test_reconstruction_with_realtime_vis() -> None:
-    map = Map()
-    map.start()
-    mock = Mock("office")
-
-    # Process frames and visualize final map
-    for frame in mock.iterate():
-        map.add_frame(frame)
-
-    show3d(map.o3d_geometry, title="Reconstructed Map").run()
-
-
-@pytest.mark.vis
-def test_splice_vis() -> None:
-    mock = Mock("test")
-    target = mock.load("a")
-    insert = mock.load("b")
-    show3d(_splice_cylinder(target.pointcloud, insert.pointcloud, shrink=0.7)).run()
-
-
-@pytest.mark.vis
-def test_robot_vis() -> None:
-    map = Map()
-    map.start()
-    mock = Mock("office")
-
-    # Process all frames
-    for frame in mock.iterate():
-        map.add_frame(frame)
-
-    show3d(map.o3d_geometry, title="global dynamic map test").run()
-
-
-@pytest.fixture
-def map_():
-    map = Map(voxel_size=0.5)
-    yield map
-    map.stop()
diff --git a/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py b/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py
index c9ea8ae6cf..0d23b839bd 100644
--- a/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py
+++ b/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py
@@ -160,13 +160,7 @@
 
 spatial = autoconnect(
     nav,
-    # TODO: Turn back on. Turned off to stop logging.
-    # EEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEE
-    # EEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEE
-    # EEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEE
-    # EEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEE
-    # EEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEEE
-    # spatial_memory(),
+    spatial_memory(),
     utilization(),
 ).global_config(n_dask_workers=8)
 
diff --git a/pyproject.toml b/pyproject.toml
index 91b1a1288d..f3752d0894 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -346,24 +346,21 @@ follow_imports = "skip"
 testpaths = ["dimos"]
 markers = [
     "heavy: resource heavy test",
-    "vis: marks tests that run visuals and require a visual check by dev",
-    "benchmark: benchmark, executes something multiple times, calculates avg, prints to console",
-    "exclude: arbitrary exclusion from CI and default test exec",
     "tool: dev tooling",
-    "needsdata: needs test data to be downloaded",
     "ros: depend on ros",
     "lcm: tests that run actual LCM bus (can't execute in CI)",
     "module: tests that need to run directly as modules",
     "gpu: tests that require GPU",
     "tofix: temporarily disabled test",
     "e2e: end to end tests",
-    "temporal: not working for me",
     "integration: slower integration tests",
+    "neverending: they don't finish",
+    "mujoco: tests which open mujoco",
 ]
 env = [
   "GOOGLE_MAPS_API_KEY=AIzafake_google_key"
 ]
-addopts = "-v -p no:warnings -ra --color=yes -m 'not (vis or benchmark or exclude or tool or needsdata or lcm or ros or heavy or gpu or module or tofix or e2e or temporal or integration)'"
+addopts = "-v -p no:warnings -ra --color=yes -m 'not (vis or exclude or tool or lcm or ros or heavy or gpu or module or tofix or e2e or integration or neverending or mujoco)'"
 asyncio_mode = "auto"
 asyncio_default_fixture_loop_scope = "function"
 

From 18b14517b9e53bfc370b4b6eaae70537f60ab27f Mon Sep 17 00:00:00 2001
From: Paul Nechifor <paul@nechifor.net>
Date: Wed, 21 Jan 2026 06:45:51 +0200
Subject: [PATCH 2/4] fix imports

---
 dimos/agents/vlm_agent.py                         |  2 +-
 dimos/control/blueprints.py                       |  1 -
 dimos/control/hardware_interface.py               |  2 +-
 dimos/control/orchestrator.py                     |  1 -
 dimos/models/vl/test_vlm.py                       |  2 +-
 .../test_wavefront_frontier_goal_selector.py      |  2 --
 .../temporal_memory/temporal_memory.py            |  1 -
 .../temporal_memory/temporal_memory_example.py    |  1 -
 .../temporal_memory/temporal_utils/graph_utils.py |  1 -
 dimos/protocol/pubsub/benchmark/type.py           | 15 ++-------------
 dimos/protocol/pubsub/test_rospubsub.py           |  1 -
 dimos/robot/drone/test_drone.py                   |  1 -
 dimos/robot/unitree_webrtc/modular/detect.py      |  1 -
 .../unitree_webrtc/unitree_go2_blueprints.py      |  1 -
 14 files changed, 5 insertions(+), 27 deletions(-)

diff --git a/dimos/agents/vlm_agent.py b/dimos/agents/vlm_agent.py
index b523cfbaf8..0b99fe4d1c 100644
--- a/dimos/agents/vlm_agent.py
+++ b/dimos/agents/vlm_agent.py
@@ -14,7 +14,7 @@
 
 from typing import Any
 
-from langchain_core.messages import AIMessage, HumanMessage, SystemMessage
+from langchain_core.messages import AIMessage, HumanMessage
 
 from dimos.agents.llm_init import build_llm, build_system_message
 from dimos.agents.spec import AgentSpec, AnyMessage
diff --git a/dimos/control/blueprints.py b/dimos/control/blueprints.py
index 5cbc109ece..d38ac1f81f 100644
--- a/dimos/control/blueprints.py
+++ b/dimos/control/blueprints.py
@@ -38,7 +38,6 @@
 from __future__ import annotations
 
 from dimos.control.orchestrator import (
-    ControlOrchestrator,
     HardwareConfig,
     TaskConfig,
     control_orchestrator,
diff --git a/dimos/control/hardware_interface.py b/dimos/control/hardware_interface.py
index e4fba70e1c..ef62f974c6 100644
--- a/dimos/control/hardware_interface.py
+++ b/dimos/control/hardware_interface.py
@@ -24,7 +24,7 @@
 
 import logging
 import time
-from typing import TYPE_CHECKING, Protocol, runtime_checkable
+from typing import Protocol, runtime_checkable
 
 from dimos.hardware.manipulators.spec import ControlMode, ManipulatorBackend
 
diff --git a/dimos/control/orchestrator.py b/dimos/control/orchestrator.py
index e7ea147dcf..2d64620b13 100644
--- a/dimos/control/orchestrator.py
+++ b/dimos/control/orchestrator.py
@@ -27,7 +27,6 @@
 
 from __future__ import annotations
 
-from collections.abc import Callable
 from dataclasses import dataclass, field
 import threading
 import time
diff --git a/dimos/models/vl/test_vlm.py b/dimos/models/vl/test_vlm.py
index 120dfb74fb..741e0dede2 100644
--- a/dimos/models/vl/test_vlm.py
+++ b/dimos/models/vl/test_vlm.py
@@ -1,3 +1,4 @@
+import os
 import time
 from typing import TYPE_CHECKING
 
@@ -5,7 +6,6 @@
     ImageAnnotations,
 )
 import pytest
-import os
 
 from dimos.core import LCMTransport
 from dimos.models.vl.moondream import MoondreamVlModel
diff --git a/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py b/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py
index 20597dc87b..1c8082b414 100644
--- a/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py
+++ b/dimos/navigation/frontier_exploration/test_wavefront_frontier_goal_selector.py
@@ -15,12 +15,10 @@
 import time
 
 import numpy as np
-from PIL import ImageDraw
 import pytest
 
 from dimos.msgs.geometry_msgs import Vector3
 from dimos.msgs.nav_msgs import CostValues, OccupancyGrid
-from dimos.navigation.frontier_exploration.utils import costmap_to_pil_image
 from dimos.navigation.frontier_exploration.wavefront_frontier_goal_selector import (
     WavefrontFrontierExplorer,
 )
diff --git a/dimos/perception/experimental/temporal_memory/temporal_memory.py b/dimos/perception/experimental/temporal_memory/temporal_memory.py
index a328186173..29d4ecf3d9 100644
--- a/dimos/perception/experimental/temporal_memory/temporal_memory.py
+++ b/dimos/perception/experimental/temporal_memory/temporal_memory.py
@@ -44,7 +44,6 @@
 from .clip_filter import (
     CLIP_AVAILABLE,
     adaptive_keyframes,
-    select_diverse_frames_simple,
 )
 
 try:
diff --git a/dimos/perception/experimental/temporal_memory/temporal_memory_example.py b/dimos/perception/experimental/temporal_memory/temporal_memory_example.py
index df435df3cc..8ba28bb174 100644
--- a/dimos/perception/experimental/temporal_memory/temporal_memory_example.py
+++ b/dimos/perception/experimental/temporal_memory/temporal_memory_example.py
@@ -22,7 +22,6 @@
 3. Query the temporal memory about entities and events
 """
 
-import os
 from pathlib import Path
 
 from dotenv import load_dotenv
diff --git a/dimos/perception/experimental/temporal_memory/temporal_utils/graph_utils.py b/dimos/perception/experimental/temporal_memory/temporal_utils/graph_utils.py
index bc55f7c65c..315d267a0c 100644
--- a/dimos/perception/experimental/temporal_memory/temporal_utils/graph_utils.py
+++ b/dimos/perception/experimental/temporal_memory/temporal_utils/graph_utils.py
@@ -15,7 +15,6 @@
 """Graph database utility functions for temporal memory."""
 
 import re
-import time
 from typing import TYPE_CHECKING, Any
 
 from dimos.utils.logging_config import setup_logger
diff --git a/dimos/protocol/pubsub/benchmark/type.py b/dimos/protocol/pubsub/benchmark/type.py
index d27da2fde6..79101df9c5 100644
--- a/dimos/protocol/pubsub/benchmark/type.py
+++ b/dimos/protocol/pubsub/benchmark/type.py
@@ -17,20 +17,9 @@
 from collections.abc import Callable, Iterator, Sequence
 from contextlib import AbstractContextManager
 from dataclasses import dataclass, field
-import pickle
-import threading
-import time
-from typing import Any, Generic, TypeVar
-
-import pytest
-
-from dimos.msgs.geometry_msgs import Vector3
-from dimos.msgs.sensor_msgs.Image import Image
-from dimos.protocol.pubsub.lcmpubsub import LCM, Topic
-from dimos.protocol.pubsub.memory import Memory
-from dimos.protocol.pubsub.shmpubsub import PickleSharedMemory
+from typing import Any, Generic
+
 from dimos.protocol.pubsub.spec import MsgT, PubSub, TopicT
-from dimos.utils.data import get_data
 
 MsgGen = Callable[[int], tuple[TopicT, MsgT]]
 
diff --git a/dimos/protocol/pubsub/test_rospubsub.py b/dimos/protocol/pubsub/test_rospubsub.py
index b536f95abe..3a3a020586 100644
--- a/dimos/protocol/pubsub/test_rospubsub.py
+++ b/dimos/protocol/pubsub/test_rospubsub.py
@@ -14,7 +14,6 @@
 
 from collections.abc import Generator
 import threading
-import time
 
 from dimos_lcm.geometry_msgs import PointStamped
 import numpy as np
diff --git a/dimos/robot/drone/test_drone.py b/dimos/robot/drone/test_drone.py
index 6433f77ec5..bfbaa9ed54 100644
--- a/dimos/robot/drone/test_drone.py
+++ b/dimos/robot/drone/test_drone.py
@@ -24,7 +24,6 @@
 from unittest.mock import MagicMock, patch
 
 import numpy as np
-import pytest
 
 from dimos.msgs.geometry_msgs import PoseStamped, Quaternion, Vector3
 from dimos.msgs.sensor_msgs import Image, ImageFormat
diff --git a/dimos/robot/unitree_webrtc/modular/detect.py b/dimos/robot/unitree_webrtc/modular/detect.py
index 64e3bbe30a..8f92d15e81 100644
--- a/dimos/robot/unitree_webrtc/modular/detect.py
+++ b/dimos/robot/unitree_webrtc/modular/detect.py
@@ -141,7 +141,6 @@ def process_data():  # type: ignore[no-untyped-def]
         Detection2DModule,
         build_imageannotations,
     )
-    from dimos.robot.unitree_webrtc.type.lidar import pointcloud2_from_webrtc_lidar
     from dimos.robot.unitree_webrtc.type.odometry import Odometry
     from dimos.utils.data import get_data
     from dimos.utils.testing import TimedSensorReplay
diff --git a/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py b/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py
index 0d23b839bd..b683b76559 100644
--- a/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py
+++ b/dimos/robot/unitree_webrtc/unitree_go2_blueprints.py
@@ -45,7 +45,6 @@
 from dimos.mapping.costmapper import cost_mapper
 from dimos.mapping.voxels import voxel_mapper
 from dimos.msgs.geometry_msgs import PoseStamped
-from dimos.msgs.nav_msgs import OccupancyGrid
 from dimos.msgs.sensor_msgs import Image, PointCloud2
 from dimos.msgs.vision_msgs import Detection2DArray
 from dimos.navigation.frontier_exploration import (

From d8112a43541f67c0452ccdd50b5a81c4b80086a8 Mon Sep 17 00:00:00 2001
From: Paul Nechifor <paul@nechifor.net>
Date: Wed, 21 Jan 2026 07:05:22 +0200
Subject: [PATCH 3/4] remove cuda sharpness test

---
 dimos/msgs/sensor_msgs/image_impls/test_image_backends.py | 8 +-------
 1 file changed, 1 insertion(+), 7 deletions(-)

diff --git a/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py b/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py
index d3a5bf91e2..7951a095b3 100644
--- a/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py
+++ b/dimos/msgs/sensor_msgs/image_impls/test_image_backends.py
@@ -221,19 +221,13 @@ def test_perf_alloc(alloc_timer) -> None:
 def test_sharpness(alloc_timer) -> None:
     """Test sharpness computation with NumpyImage always, add CudaImage parity when available."""
     arr = _prepare_image(ImageFormat.BGR, (64, 64, 3))
-    cpu, gpu, _, _ = alloc_timer(arr, ImageFormat.BGR)
+    cpu = alloc_timer(arr, ImageFormat.BGR)[0]
 
     # Always test CPU backend
     s_cpu = cpu.sharpness
     assert s_cpu >= 0  # Sharpness should be non-negative
     assert s_cpu < 1000  # Reasonable upper bound
 
-    # Optionally test GPU parity when CUDA is available
-    if gpu is not None:
-        s_gpu = gpu.sharpness
-        # Values should be very close; minor border/rounding differences allowed
-        assert abs(s_cpu - s_gpu) < 5e-2
-
 
 def test_to_opencv(alloc_timer) -> None:
     """Test to_opencv conversion with NumpyImage always, add CudaImage parity when available."""

From 37a7d7787030bc32e7c5f0218d39201d77101dd8 Mon Sep 17 00:00:00 2001
From: Paul Nechifor <paul@nechifor.net>
Date: Wed, 21 Jan 2026 07:29:38 +0200
Subject: [PATCH 4/4] PYTHONWARNINGS

---
 pyproject.toml | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index f3752d0894..78ee5c51a4 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -358,7 +358,8 @@ markers = [
     "mujoco: tests which open mujoco",
 ]
 env = [
-  "GOOGLE_MAPS_API_KEY=AIzafake_google_key"
+  "GOOGLE_MAPS_API_KEY=AIzafake_google_key",
+  "PYTHONWARNINGS=ignore:cupyx.jit.rawkernel is experimental:FutureWarning",
 ]
 addopts = "-v -p no:warnings -ra --color=yes -m 'not (vis or exclude or tool or lcm or ros or heavy or gpu or module or tofix or e2e or integration or neverending or mujoco)'"
 asyncio_mode = "auto"