From a927537833ae355209cae512dd1b124bc61a7b93 Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Mon, 30 Mar 2026 11:56:09 +0700
Subject: [PATCH 01/16] feat: update executable path

---
 setup.cfg | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/setup.cfg b/setup.cfg
index 8a56203..ba5dc02 100644
--- a/setup.cfg
+++ b/setup.cfg
@@ -1,5 +1,5 @@
 [build_scripts]
-executable=/usr/bin/env python3
+executable=/home/group11/final_project_ws/real_vision_venv/bin/python3
 [develop]
 script_dir=$base/lib/vision
 [install]

From 0721e7700a95d50f2be0ab8aee0455dd3b2f3aed Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Mon, 30 Mar 2026 11:57:12 +0700
Subject: [PATCH 02/16] feat: fix clip visualization

---
 vision/clip_classifier.py | 42 +++++++++++++++++++++++++++++----------
 1 file changed, 32 insertions(+), 10 deletions(-)

diff --git a/vision/clip_classifier.py b/vision/clip_classifier.py
index 8bc0eb3..b0d654b 100755
--- a/vision/clip_classifier.py
+++ b/vision/clip_classifier.py
@@ -51,6 +51,7 @@
 import cv2
 import numpy as np
 import sys
+import os
 import json
 from datetime import datetime
 from typing import List, Dict, Tuple, Optional
@@ -277,8 +278,12 @@ def __init__(self, candidate_labels: List[str] = None):
             )
             self.get_logger().warn("Subscribing to: /vision/sam_detections (placeholder Image). Build msgs for full integration.")
         
+        # Mitigate OpenCV Qt backend font path issues in virtual environments.
+        self._configure_opencv_qt_fonts()
+
         # OpenCV window setup
         self.window_name = f"CLIP Classifier - {self.rgb_topic}"
+        cv2.startWindowThread()
         cv2.namedWindow(self.window_name, cv2.WINDOW_NORMAL)
         cv2.resizeWindow(self.window_name, 800, 600)
         
@@ -300,6 +305,29 @@ def __init__(self, candidate_labels: List[str] = None):
         self.get_logger().info("Service: /vision/find_multi_object")
         self.get_logger().info(f"Subscriber: /vision/sam_detections (auto-classify on SAM publish)")
         self.get_logger().info(f"OpenCV Window: '{self.window_name}'")
+
+    def _configure_opencv_qt_fonts(self):
+        """Set a valid Qt font directory when OpenCV's bundled qt/fonts folder is missing."""
+        if os.environ.get('QT_QPA_FONTDIR'):
+            return
+
+        candidate_dirs = [
+            '/usr/share/fonts/truetype/dejavu',
+            '/usr/share/fonts/truetype/freefont',
+            '/usr/share/fonts/truetype/liberation2',
+            '/usr/share/fonts',
+        ]
+
+        for font_dir in candidate_dirs:
+            if os.path.isdir(font_dir):
+                os.environ['QT_QPA_FONTDIR'] = font_dir
+                self.get_logger().info(f"Set QT_QPA_FONTDIR to {font_dir}")
+                return
+
+        self.get_logger().warn(
+            "Could not find a system font directory for QT_QPA_FONTDIR. "
+            "OpenCV Qt warnings may appear."
+        )
     
     def _init_clip_model(self):
         """Initialize CLIP model"""
@@ -1548,16 +1576,10 @@ def main(args=None):
     
     try:
         node = CLIPClassifier(candidate_labels=candidate_labels)
-        
-        # Use MultiThreadedExecutor for ReentrantCallbackGroup
-        executor = MultiThreadedExecutor()
-        executor.add_node(node)
-        
-        try:
-            executor.spin()
-        finally:
-            executor.shutdown()
-            node.destroy_node()
+
+        # Keep OpenCV HighGUI operations on the main thread for stable rendering.
+        rclpy.spin(node)
+        node.destroy_node()
     except KeyboardInterrupt:
         pass
     finally:

From 48c3d541b6528450426b6877d39f0db128918aa9 Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Mon, 30 Mar 2026 18:20:21 +0700
Subject: [PATCH 03/16] fix: obb not receiving SAM detections

---
 vision/clip_classifier.py        |  42 +++--------
 vision/obb_angle_service_node.py | 115 ++++++++++++++++++++++++-------
 2 files changed, 101 insertions(+), 56 deletions(-)

diff --git a/vision/clip_classifier.py b/vision/clip_classifier.py
index b0d654b..8bc0eb3 100755
--- a/vision/clip_classifier.py
+++ b/vision/clip_classifier.py
@@ -51,7 +51,6 @@
 import cv2
 import numpy as np
 import sys
-import os
 import json
 from datetime import datetime
 from typing import List, Dict, Tuple, Optional
@@ -278,12 +277,8 @@ def __init__(self, candidate_labels: List[str] = None):
             )
             self.get_logger().warn("Subscribing to: /vision/sam_detections (placeholder Image). Build msgs for full integration.")
         
-        # Mitigate OpenCV Qt backend font path issues in virtual environments.
-        self._configure_opencv_qt_fonts()
-
         # OpenCV window setup
         self.window_name = f"CLIP Classifier - {self.rgb_topic}"
-        cv2.startWindowThread()
         cv2.namedWindow(self.window_name, cv2.WINDOW_NORMAL)
         cv2.resizeWindow(self.window_name, 800, 600)
         
@@ -305,29 +300,6 @@ def __init__(self, candidate_labels: List[str] = None):
         self.get_logger().info("Service: /vision/find_multi_object")
         self.get_logger().info(f"Subscriber: /vision/sam_detections (auto-classify on SAM publish)")
         self.get_logger().info(f"OpenCV Window: '{self.window_name}'")
-
-    def _configure_opencv_qt_fonts(self):
-        """Set a valid Qt font directory when OpenCV's bundled qt/fonts folder is missing."""
-        if os.environ.get('QT_QPA_FONTDIR'):
-            return
-
-        candidate_dirs = [
-            '/usr/share/fonts/truetype/dejavu',
-            '/usr/share/fonts/truetype/freefont',
-            '/usr/share/fonts/truetype/liberation2',
-            '/usr/share/fonts',
-        ]
-
-        for font_dir in candidate_dirs:
-            if os.path.isdir(font_dir):
-                os.environ['QT_QPA_FONTDIR'] = font_dir
-                self.get_logger().info(f"Set QT_QPA_FONTDIR to {font_dir}")
-                return
-
-        self.get_logger().warn(
-            "Could not find a system font directory for QT_QPA_FONTDIR. "
-            "OpenCV Qt warnings may appear."
-        )
     
     def _init_clip_model(self):
         """Initialize CLIP model"""
@@ -1576,10 +1548,16 @@ def main(args=None):
     
     try:
         node = CLIPClassifier(candidate_labels=candidate_labels)
-
-        # Keep OpenCV HighGUI operations on the main thread for stable rendering.
-        rclpy.spin(node)
-        node.destroy_node()
+        
+        # Use MultiThreadedExecutor for ReentrantCallbackGroup
+        executor = MultiThreadedExecutor()
+        executor.add_node(node)
+        
+        try:
+            executor.spin()
+        finally:
+            executor.shutdown()
+            node.destroy_node()
     except KeyboardInterrupt:
         pass
     finally:
diff --git a/vision/obb_angle_service_node.py b/vision/obb_angle_service_node.py
index 9bdf7d6..f205cf5 100644
--- a/vision/obb_angle_service_node.py
+++ b/vision/obb_angle_service_node.py
@@ -37,6 +37,7 @@
 from rclpy.node import Node
 from rclpy.callback_groups import ReentrantCallbackGroup
 from rclpy.executors import MultiThreadedExecutor
+from rclpy.qos import QoSProfile, ReliabilityPolicy, DurabilityPolicy
 from custom_interfaces.srv import FindObjectAngleBB, FindObjectAngle, DetectObjects
 from custom_interfaces.msg import SAMDetections
 from sensor_msgs.msg import Image, CameraInfo
@@ -44,6 +45,7 @@
 import numpy as np
 import cv2
 import time
+import threading
 
 
 class OBBAngleServiceNode(Node):
@@ -55,8 +57,10 @@ class OBBAngleServiceNode(Node):
     def __init__(self):
         super().__init__('obb_angle_service_node')
         
-        # Use reentrant callback group for nested service calls
-        self.callback_group = ReentrantCallbackGroup()
+        # Keep subscriptions and services in separate callback groups so
+        # detection updates can be processed while service callbacks are waiting.
+        self.subscription_callback_group = ReentrantCallbackGroup()
+        self.service_callback_group = ReentrantCallbackGroup()
         
         # Storage for latest detections and images
         self.latest_detections = None
@@ -66,8 +70,13 @@ def __init__(self):
         self.bridge = CvBridge()
         
         # Thread lock for thread-safe access
-        import threading
         self.detections_lock = threading.Lock()
+        self.detections_condition = threading.Condition(self.detections_lock)
+        self.latest_detections_stamp_ns = 0
+
+        # Queue visualization work so service callbacks can return immediately.
+        self.viz_lock = threading.Lock()
+        self.pending_viz = None
         
         # OpenCV visualization window (unified for both single and multi-object)
         self.window_name = 'OBB Angle Detection'
@@ -80,13 +89,21 @@ def __init__(self):
             self.rgb_topic = '/camera/color/image_raw'
         else:
             self.rgb_topic = '/camera/image_raw'
+
+        # A BEST_EFFORT subscription matches both RELIABLE and BEST_EFFORT publishers, so it stays compatible with high-rate detector topics.
+        self.sam_qos = QoSProfile(
+            depth=10,
+            reliability=ReliabilityPolicy.BEST_EFFORT,
+            durability=DurabilityPolicy.VOLATILE,
+        )
         
         # Subscribe to RGB camera for visualization
         self.rgb_subscription = self.create_subscription(
             Image,
             self.rgb_topic,
             self.rgb_callback,
-            10
+            10,
+            callback_group=self.subscription_callback_group,
         )
         
         # Subscribe to SAM detections for multi-object OBB
@@ -94,7 +111,8 @@ def __init__(self):
             SAMDetections,
             '/vision/sam_detections',
             self.sam_detections_callback,
-            10
+            self.sam_qos,
+            callback_group=self.subscription_callback_group,
         )
         
         # Subscribe to depth camera
@@ -102,7 +120,8 @@ def __init__(self):
             Image,
             "/camera/depth/image_rect_raw",
             self.depth_callback,
-            10
+            10,
+            callback_group=self.subscription_callback_group,
         )
         
         # Subscribe to camera info
@@ -110,14 +129,15 @@ def __init__(self):
             CameraInfo,
             "/camera/color/camera_info",
             self.info_callback,
-            10
+            10,
+            callback_group=self.subscription_callback_group,
         )
         
         # Service client for real-time detection
         self.detect_objects_client = self.create_client(
             DetectObjects,
             '/vision/detect_objects',
-            callback_group=self.callback_group
+            callback_group=self.service_callback_group
         )
         
         # Create OBB angle service servers
@@ -125,14 +145,14 @@ def __init__(self):
             FindObjectAngleBB,
             '/obb/find_object_angle_bb',
             self.find_object_angle_bb_callback,
-            callback_group=self.callback_group
+            callback_group=self.service_callback_group
         )
         
         self.find_object_angle_srv = self.create_service(
             FindObjectAngle,
             '/obb/find_object_angle',
             self.find_object_angle_callback,
-            callback_group=self.callback_group
+            callback_group=self.service_callback_group
         )
         
         # Create OpenCV window (unified)
@@ -152,6 +172,7 @@ def __init__(self):
         self.get_logger().info('  - /obb/find_object_angle (All objects OBB)')
         self.get_logger().info('Subscriptions:')
         self.get_logger().info('  - /vision/sam_detections (SAMDetections)')
+        self.get_logger().info('  - /vision/sam_detections QoS: BEST_EFFORT, VOLATILE, depth=10')
         self.get_logger().info(f'  - {self.rgb_topic} (Image)')
         self.get_logger().info('  - /camera/depth/image_rect_raw (Image)')
         self.get_logger().info('  - /camera/color/camera_info (CameraInfo)')
@@ -177,9 +198,28 @@ def rgb_callback(self, msg: Image):
     
     def sam_detections_callback(self, msg: SAMDetections):
         """Store latest SAM detections"""
-        with self.detections_lock:
+        with self.detections_condition:
             self.latest_detections = msg
+            self.latest_detections_stamp_ns = time.monotonic_ns()
+            self.detections_condition.notify_all()
+            if not hasattr(self, '_sam_received'):
+                self._sam_received = True
+                self.get_logger().info(f'First SAM detections received: {msg.total_detections} objects')
             self.get_logger().debug(f'Received SAM detections: {msg.total_detections} objects')
+
+    def wait_for_sam_detections(self, timeout_sec=1.5, min_stamp_ns=0):
+        """Block until a SAM detection message stamped at or after min_stamp_ns is available; return False if timeout_sec elapses first."""
+        deadline = time.monotonic() + timeout_sec
+        with self.detections_condition:
+            while True:
+                if self.latest_detections is not None and self.latest_detections_stamp_ns >= min_stamp_ns:
+                    return True
+
+                remaining = deadline - time.monotonic()
+                if remaining <= 0.0:
+                    return False
+
+                self.detections_condition.wait(timeout=min(0.05, remaining))
     
     def depth_callback(self, msg: Image):
         """Store latest depth image"""
@@ -194,9 +234,28 @@ def info_callback(self, msg: CameraInfo):
     
     def keep_window_alive(self):
         """Timer callback to keep OpenCV window responsive"""
-        # This just calls waitKey to process window events
-        # Without this, the window may freeze or not display properly
-        cv2.waitKey(1)
+        # Render queued visualization outside service callbacks to avoid
+        # blocking service responses on GUI operations.
+        pending = None
+        with self.viz_lock:
+            if self.pending_viz is not None:
+                pending = self.pending_viz
+                self.pending_viz = None
+
+        if pending is not None:
+            results, mode = pending
+            try:
+                self.visualize_obb(results, mode=mode)
+            except Exception as e:
+                self.get_logger().warn(f'Visualization update failed: {e}')
+        else:
+            # Process window events even when no new frame is queued.
+            cv2.waitKey(1)
+
+    def queue_visualization(self, results, mode="auto"):
+        """Queue the latest visualization payload for timer-based rendering."""
+        with self.viz_lock:
+            self.pending_viz = (results, mode)
     
     def calculate_obb_from_bbox(self, x1, y1, x2, y2, mask=None):
         """
@@ -552,11 +611,15 @@ def find_object_angle_bb_callback(self, request, response):
                 return response
             
             # Trigger real-time detection to get fresh detections
+            request_stamp_ns = time.monotonic_ns()
             self.get_logger().info('Triggering real-time detection...')
             detection_success = self.trigger_real_time_detection()
-            
-            # Small delay to ensure detections are updated
-            time.sleep(0.1)
+            min_stamp_ns = request_stamp_ns if detection_success else 0
+
+            # Wait for SAM callback instead of fixed sleep.
+            got_sam = self.wait_for_sam_detections(timeout_sec=1.5, min_stamp_ns=min_stamp_ns)
+            if not got_sam:
+                self.get_logger().warn('Timed out waiting for SAM detections update')
             
             # Get latest detections
             with self.detections_lock:
@@ -649,9 +712,9 @@ def find_object_angle_bb_callback(self, request, response):
             self.get_logger().info(f'OBB Result ({best_detection.object_id}): center=({u:.1f},{v:.1f}), angle={angle_deg:.1f}deg, size={width:.0f}x{height:.0f}')
             self.get_logger().info('=' * 60)
             
-            # Visualize with unified function - pass the INPUT bbox from request for visualization
+            # Queue visualization; do not block service response path.
             viz_data = [(best_detection.object_id, u, v, theta_geom, width, height, [request.x1, request.y1, request.x2, request.y2])]
-            self.visualize_obb(viz_data, mode="single")
+            self.queue_visualization(viz_data, mode="single")
             
         except Exception as e:
             self.get_logger().error(f'Error in find_object_angle_bb: {e}')
@@ -678,11 +741,15 @@ def find_object_angle_callback(self, request, response):
         
         try:
             # Trigger real-time detection
+            request_stamp_ns = time.monotonic_ns()
             self.get_logger().info('Triggering real-time detection for all objects...')
             detection_success = self.trigger_real_time_detection()
-            
-            # Small delay to ensure detections are updated
-            time.sleep(0.1)
+            min_stamp_ns = request_stamp_ns if detection_success else 0
+
+            # Wait for SAM callback instead of fixed sleep.
+            got_sam = self.wait_for_sam_detections(timeout_sec=1.5, min_stamp_ns=min_stamp_ns)
+            if not got_sam:
+                self.get_logger().warn('Timed out waiting for SAM detections update')
             
             # Get latest detections
             with self.detections_lock:
@@ -791,7 +858,7 @@ def find_object_angle_callback(self, request, response):
             
             # Visualize all objects with unified function
             if len(viz_results) > 0:
-                self.visualize_obb(viz_results, mode="multi")
+                self.queue_visualization(viz_results, mode="multi")
             
         except Exception as e:
             self.get_logger().error(f'Error in find_object_angle: {e}')
@@ -822,7 +889,7 @@ def main(args=None):
     node = OBBAngleServiceNode()
     
     # Use MultiThreadedExecutor for non-blocking service calls
-    executor = MultiThreadedExecutor()
+    executor = MultiThreadedExecutor(num_threads=4)
     executor.add_node(node)
     
     try:

From a4d790f3e7c8545a37fe0d1bbc5f3efeac35c3bd Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Mon, 30 Mar 2026 18:48:35 +0700
Subject: [PATCH 04/16] fix: clip and obb visualization

---
 vision/clip_classifier.py        | 11 +++++++----
 vision/obb_angle_service_node.py | 10 +++++++---
 2 files changed, 14 insertions(+), 7 deletions(-)

diff --git a/vision/clip_classifier.py b/vision/clip_classifier.py
index 8bc0eb3..897094e 100755
--- a/vision/clip_classifier.py
+++ b/vision/clip_classifier.py
@@ -282,8 +282,9 @@ def __init__(self, candidate_labels: List[str] = None):
         cv2.namedWindow(self.window_name, cv2.WINDOW_NORMAL)
         cv2.resizeWindow(self.window_name, 800, 600)
         
-        # Timer for visualization (30 Hz)
-        self.viz_timer = self.create_timer(0.033, self.visualization_callback)
+        # GUI updates are pumped from the main thread in main() to avoid
+        # HighGUI freezes under multi-threaded executors.
+        self.viz_timer = None
         
         self.get_logger().info("CLIP Classifier Started")
         self.get_logger().info(f"Subscribing to: {self.rgb_topic}")
@@ -1550,11 +1551,13 @@ def main(args=None):
         node = CLIPClassifier(candidate_labels=candidate_labels)
         
         # Use MultiThreadedExecutor for ReentrantCallbackGroup
-        executor = MultiThreadedExecutor()
+        executor = MultiThreadedExecutor(num_threads=4)
         executor.add_node(node)
         
         try:
-            executor.spin()
+            while rclpy.ok():
+                executor.spin_once(timeout_sec=0.03)
+                node.visualization_callback()
         finally:
             executor.shutdown()
             node.destroy_node()
diff --git a/vision/obb_angle_service_node.py b/vision/obb_angle_service_node.py
index f205cf5..41b36cd 100644
--- a/vision/obb_angle_service_node.py
+++ b/vision/obb_angle_service_node.py
@@ -159,8 +159,9 @@ def __init__(self):
         cv2.namedWindow(self.window_name, cv2.WINDOW_NORMAL)
         cv2.resizeWindow(self.window_name, 1200, 800)
         
-        # Create timer for continuous window update (keeps window responsive)
-        self.viz_timer = self.create_timer(0.1, self.keep_window_alive)
+        # GUI updates are pumped from the main thread in main() to avoid
+        # HighGUI freezes under multi-threaded executors.
+        self.viz_timer = None
         
         self.get_logger().info('=' * 80)
         self.get_logger().info('OBB Angle Service Node Started')
@@ -894,10 +895,13 @@ def main(args=None):
     
     try:
         node.get_logger().info('OBB Angle Service Node spinning...')
-        executor.spin()
+        while rclpy.ok():
+            executor.spin_once(timeout_sec=0.03)
+            node.keep_window_alive()
     except KeyboardInterrupt:
         node.get_logger().info('Shutting down OBB Angle Service Node...')
     finally:
+        executor.shutdown()
         cv2.destroyAllWindows()
         node.destroy_node()
         rclpy.shutdown()

From 1bc315ada03ae44bc7cb0685db01c248c7b183be Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Fri, 3 Apr 2026 10:20:16 +0700
Subject: [PATCH 05/16] feat: update camera position

---
 vision/pixel_to_real_world.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/vision/pixel_to_real_world.py b/vision/pixel_to_real_world.py
index a0be114..10dab48 100644
--- a/vision/pixel_to_real_world.py
+++ b/vision/pixel_to_real_world.py
@@ -51,10 +51,12 @@ def __init__(self):
         #   error = (x - x^, y - y^, z - z^)
         #   t_base_cam_new = t_base_cam_old + error
         # This compensates for calibration errors in the camera position.
+        # In practice: place the silver tip of the tape measure at the center of the gripper and measure the distance to the center of the cube along each axis.
+        # Note the sign (+ or -) of each measured offset and add it to the corresponding component of t_base_cam.
         # Benchmark:
         # LOW: (-0.0386, 0.5303, 0.5238)
         # HIGH: (-0.0361, 0.5303, 0.6458)
-        self.t_base_cam = np.array([-0.0361, 0.5303, 0.6458])
+        self.t_base_cam = np.array([-0.146, 0.635, 0.8])
 
         self.R_base_cam = np.array([
             [1.0,  0.0,  0.0],

From f698985792d76428021566bba9d7de0d084be8f0 Mon Sep 17 00:00:00 2001
From: Methasit-Pun <methasitpun@gmail.com>
Date: Fri, 3 Apr 2026 23:15:33 +0700
Subject: [PATCH 06/16] feat: improve dashboard logic

---
 dashboard/index.html                 | 1665 ++++++++++++++++----------
 docs/COLLECT_AND_EXPORT.md           |  264 ++++
 setup.py                             |    2 +
 vision/benchmark_dashboard.py        |   11 +
 vision_scripts/collect_and_export.py |  497 ++++++++
 5 files changed, 1838 insertions(+), 601 deletions(-)
 create mode 100644 docs/COLLECT_AND_EXPORT.md
 create mode 100644 vision_scripts/collect_and_export.py

diff --git a/dashboard/index.html b/dashboard/index.html
index f8d2cfa..1071733 100644
--- a/dashboard/index.html
+++ b/dashboard/index.html
@@ -3,745 +3,1208 @@
 <head>
     <meta charset="UTF-8">
     <meta name="viewport" content="width=device-width, initial-scale=1.0">
-    <title>Vision Benchmark Dashboard</title>
+    <title>Vision Pipeline Research Dashboard</title>
     <style>
-        * {
-            margin: 0;
-            padding: 0;
-            box-sizing: border-box;
+        /* ── Design tokens ───────────────────────────────────────────── */
+        :root {
+            --bg:            #f1f5f9;
+            --surface:       #ffffff;
+            --border:        #e2e8f0;
+            --text-primary:  #0f172a;
+            --text-secondary:#64748b;
+            --text-muted:    #94a3b8;
+
+            --color-runs:      #3b82f6;
+            --color-sam:       #8b5cf6;
+            --color-clip:      #ec4899;
+            --color-grasp:     #f59e0b;
+            --color-scene:     #10b981;
+            --color-pixel:     #06b6d4;
+            --color-objects:   #6366f1;
+            --color-relations: #14b8a6;
+
+            --ok:   #22c55e;
+            --warn: #f59e0b;
+            --fail: #ef4444;
+
+            --nav-bg:   #0f172a;
+            --nav-text: #94a3b8;
+
+            --radius:    10px;
+            --radius-sm: 6px;
+            --shadow:    0 1px 3px rgba(0,0,0,.08), 0 1px 2px rgba(0,0,0,.05);
+            --shadow-md: 0 4px 6px rgba(0,0,0,.07), 0 2px 4px rgba(0,0,0,.05);
         }
 
+        *, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
+
         body {
-            font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
-            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
-            padding: 20px;
+            font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', sans-serif;
+            background: var(--bg);
+            color: var(--text-primary);
+            font-size: 14px;
+            line-height: 1.5;
+            display: flex;
             min-height: 100vh;
         }
 
-        .container {
-            max-width: 1800px;
-            margin: 0 auto;
+        /* ── Sidebar ─────────────────────────────────────────────────── */
+        #sidebar {
+            width: 226px;
+            min-width: 226px;
+            background: var(--nav-bg);
+            position: fixed;
+            top: 0; left: 0;
+            height: 100vh;
+            z-index: 100;
+            display: flex;
+            flex-direction: column;
+            overflow-y: auto;
         }
 
-        header {
-            background: white;
-            padding: 30px;
-            border-radius: 15px;
-            box-shadow: 0 10px 30px rgba(0,0,0,0.2);
-            margin-bottom: 30px;
-            text-align: center;
+        .sb-brand {
+            padding: 22px 18px 16px;
+            border-bottom: 1px solid rgba(255,255,255,.07);
         }
-
-        h1 {
-            color: #667eea;
-            font-size: 2.5em;
-            margin-bottom: 10px;
+        .sb-brand-title {
+            font-size: 13px;
+            font-weight: 700;
+            color: #fff;
+            line-height: 1.35;
+            letter-spacing: .2px;
         }
-
-        .subtitle {
-            color: #666;
-            font-size: 1.1em;
+        .sb-brand-sub {
+            font-size: 11px;
+            color: var(--nav-text);
+            margin-top: 4px;
         }
 
-        .stats-bar {
+        .sb-live {
             display: flex;
-            gap: 20px;
-            margin-bottom: 30px;
-            flex-wrap: wrap;
+            align-items: center;
+            gap: 8px;
+            padding: 9px 18px;
+            border-bottom: 1px solid rgba(255,255,255,.07);
+            font-size: 11px;
+            color: var(--nav-text);
         }
-
-        .stat-card {
-            flex: 1;
-            min-width: 200px;
-            background: white;
-            padding: 20px;
-            border-radius: 10px;
-            box-shadow: 0 5px 15px rgba(0,0,0,0.1);
-            text-align: center;
+        .live-dot {
+            width: 7px; height: 7px;
+            border-radius: 50%;
+            background: var(--ok);
+            animation: pulse 2s infinite;
+            flex-shrink: 0;
         }
-
-        .stat-number {
-            font-size: 2.5em;
-            font-weight: bold;
-            color: #667eea;
-            margin-bottom: 5px;
+        @keyframes pulse {
+            0%,100% { opacity:1; transform:scale(1); }
+            50%      { opacity:.45; transform:scale(.8); }
         }
 
-        .stat-label {
-            color: #666;
-            font-size: 0.9em;
+        .sb-group {
+            font-size: 10px;
+            font-weight: 700;
             text-transform: uppercase;
-            letter-spacing: 1px;
-        }
-
-        .section {
-            background: white;
-            padding: 30px;
-            border-radius: 15px;
-            box-shadow: 0 10px 30px rgba(0,0,0,0.2);
-            margin-bottom: 30px;
+            letter-spacing: 1.1px;
+            color: rgba(255,255,255,.22);
+            padding: 16px 18px 6px;
         }
 
-        .section-header {
+        .sb-link {
             display: flex;
-            justify-content: space-between;
             align-items: center;
-            margin-bottom: 20px;
-            padding-bottom: 15px;
-            border-bottom: 3px solid #667eea;
-        }
-
-        h2 {
-            color: #333;
-            font-size: 1.8em;
-        }
-
-        .badge {
-            background: #667eea;
-            color: white;
-            padding: 8px 20px;
-            border-radius: 20px;
-            font-size: 0.9em;
-            font-weight: bold;
+            gap: 10px;
+            padding: 8px 18px;
+            color: var(--nav-text);
+            font-size: 12.5px;
+            font-weight: 500;
+            cursor: pointer;
+            border-left: 3px solid transparent;
+            transition: background .12s, color .12s;
+            user-select: none;
         }
+        .sb-link:hover { background: rgba(255,255,255,.06); color: #fff; }
 
-        table {
-            width: 100%;
-            border-collapse: collapse;
-            margin-top: 15px;
+        .sb-dot {
+            width: 8px; height: 8px;
+            border-radius: 50%;
+            flex-shrink: 0;
         }
-
-        th {
-            background: linear-gradient(135deg, #667eea 0%, #764ba2 100%);
-            color: white;
-            padding: 15px;
-            text-align: left;
+        .sb-count {
+            margin-left: auto;
+            font-size: 11px;
             font-weight: 600;
-            text-transform: uppercase;
-            font-size: 0.85em;
-            letter-spacing: 0.5px;
+            background: rgba(255,255,255,.09);
+            padding: 1px 7px;
+            border-radius: 10px;
+            color: rgba(255,255,255,.45);
+            min-width: 24px;
+            text-align: center;
         }
 
-        td {
-            padding: 12px 15px;
-            border-bottom: 1px solid #e0e0e0;
-            color: #333;
+        /* ── Main content ────────────────────────────────────────────── */
+        #main {
+            margin-left: 226px;
+            flex: 1;
+            min-width: 0;
+            display: flex;
+            flex-direction: column;
         }
 
-        tr:hover {
-            background: #f5f5f5;
+        /* ── Top bar ─────────────────────────────────────────────────── */
+        #topbar {
+            background: var(--surface);
+            border-bottom: 1px solid var(--border);
+            padding: 13px 28px;
+            display: flex;
+            align-items: center;
+            gap: 16px;
+            position: sticky;
+            top: 0;
+            z-index: 90;
+            box-shadow: var(--shadow);
         }
+        .topbar-title  { font-size: 15px; font-weight: 700; color: var(--text-primary); }
+        .topbar-sub    { font-size: 11.5px; color: var(--text-secondary); margin-top: 1px; }
+        .topbar-right  { margin-left: auto; display: flex; align-items: center; gap: 10px; }
 
-        .no-data {
-            text-align: center;
-            padding: 40px;
-            color: #999;
-            font-style: italic;
+        .refresh-pill {
+            display: flex;
+            align-items: center;
+            gap: 6px;
+            font-size: 12px;
+            color: var(--text-secondary);
+            background: var(--bg);
+            border: 1px solid var(--border);
+            padding: 5px 13px;
+            border-radius: 20px;
         }
 
-        .success {
-            color: #4CAF50;
-            font-weight: bold;
+        .btn {
+            padding: 6px 14px;
+            border-radius: var(--radius-sm);
+            font-size: 12px;
+            font-weight: 500;
+            cursor: pointer;
+            border: 1px solid var(--border);
+            background: transparent;
+            color: var(--text-secondary);
+            transition: all .13s;
         }
+        .btn:hover { background: var(--bg); color: var(--text-primary); }
 
-        .failure {
-            color: #f44336;
-            font-weight: bold;
-        }
+        /* ── Page body ───────────────────────────────────────────────── */
+        .page-body { padding: 24px 28px; flex: 1; }
 
-        .confidence-high {
-            color: #4CAF50;
-            font-weight: bold;
+        /* ── Section label ───────────────────────────────────────────── */
+        .section-label {
+            font-size: 10.5px;
+            font-weight: 700;
+            text-transform: uppercase;
+            letter-spacing: 1px;
+            color: var(--text-muted);
+            padding-bottom: 10px;
+            margin-bottom: 16px;
+            border-bottom: 1px solid var(--border);
+            margin-top: 8px;
         }
 
-        .confidence-medium {
-            color: #FF9800;
-            font-weight: bold;
+        /* ── KPI grid ────────────────────────────────────────────────── */
+        .kpi-grid {
+            display: grid;
+            grid-template-columns: repeat(auto-fill, minmax(155px, 1fr));
+            gap: 14px;
+            margin-bottom: 28px;
         }
-
-        .confidence-low {
-            color: #f44336;
-            font-weight: bold;
+        .kpi-card {
+            background: var(--surface);
+            border: 1px solid var(--border);
+            border-radius: var(--radius);
+            padding: 16px 18px;
+            box-shadow: var(--shadow);
+            position: relative;
+            overflow: hidden;
         }
-
-        .timestamp {
-            color: #999;
-            font-size: 0.85em;
+        .kpi-card::before {
+            content: '';
+            position: absolute;
+            top: 0; left: 0; right: 0;
+            height: 3px;
+            background: var(--accent, #3b82f6);
         }
-
-        .controls {
-            display: flex;
-            gap: 10px;
-            align-items: center;
+        .kpi-value {
+            font-size: 30px;
+            font-weight: 700;
+            color: var(--text-primary);
+            line-height: 1;
+            margin-bottom: 6px;
+            font-variant-numeric: tabular-nums;
         }
-
-        button {
-            background: #667eea;
-            color: white;
-            border: none;
-            padding: 10px 20px;
-            border-radius: 5px;
-            cursor: pointer;
-            font-size: 0.9em;
-            transition: all 0.3s;
+        .kpi-label {
+            font-size: 11px;
+            font-weight: 600;
+            text-transform: uppercase;
+            letter-spacing: .7px;
+            color: var(--text-secondary);
+        }
+        .kpi-sub {
+            font-size: 10.5px;
+            color: var(--text-muted);
+            margin-top: 3px;
         }
 
-        button:hover {
-            background: #764ba2;
-            transform: translateY(-2px);
-            box-shadow: 0 5px 15px rgba(0,0,0,0.2);
+        /* ── Section cards ───────────────────────────────────────────── */
+        .section-card {
+            background: var(--surface);
+            border: 1px solid var(--border);
+            border-radius: var(--radius);
+            box-shadow: var(--shadow);
+            margin-bottom: 22px;
+            overflow: hidden;
         }
 
-        .auto-refresh {
+        .section-head {
+            padding: 15px 20px;
+            border-bottom: 1px solid var(--border);
             display: flex;
             align-items: center;
-            gap: 10px;
-            color: white;
-            background: rgba(255,255,255,0.2);
-            padding: 10px 15px;
-            border-radius: 5px;
+            gap: 12px;
+            background: #fafbfc;
         }
-
-        .indicator {
-            width: 12px;
-            height: 12px;
-            border-radius: 50%;
-            background: #4CAF50;
-            animation: pulse 2s infinite;
-        }
-
-        @keyframes pulse {
-            0%, 100% { opacity: 1; }
-            50% { opacity: 0.5; }
+        .section-accent {
+            width: 4px;
+            height: 38px;
+            border-radius: 3px;
+            flex-shrink: 0;
         }
-
-        .bbox-coords {
-            font-family: 'Courier New', monospace;
-            font-size: 0.9em;
-            color: #666;
+        .section-title      { font-size: 14px; font-weight: 700; color: var(--text-primary); }
+        .section-subtitle   { font-size: 11px; color: var(--text-secondary); margin-top: 2px; font-family: monospace; }
+        .section-badge {
+            margin-left: auto;
+            font-size: 11px;
+            font-weight: 700;
+            padding: 4px 12px;
+            border-radius: 14px;
+            color: #fff;
+            white-space: nowrap;
         }
 
-        .metric-bar {
+        /* ── Metric strip ────────────────────────────────────────────── */
+        .metric-strip {
             display: flex;
-            gap: 15px;
-            margin-top: 15px;
-            padding: 15px;
-            background: #f8f9fa;
-            border-radius: 8px;
+            border-bottom: 1px solid var(--border);
         }
-
-        .metric-item {
+        .metric-tile {
             flex: 1;
+            padding: 14px 18px;
             text-align: center;
+            border-right: 1px solid var(--border);
         }
-
-        .metric-value {
-            font-size: 1.5em;
-            font-weight: bold;
-            color: #667eea;
+        .metric-tile:last-child { border-right: none; }
+        .metric-val {
+            font-size: 22px;
+            font-weight: 700;
+            color: var(--text-primary);
+            font-variant-numeric: tabular-nums;
+            line-height: 1;
         }
-
-        .metric-label {
-            font-size: 0.85em;
-            color: #666;
+        .metric-lbl {
+            font-size: 10.5px;
+            font-weight: 600;
+            text-transform: uppercase;
+            letter-spacing: .6px;
+            color: var(--text-secondary);
             margin-top: 5px;
         }
 
-        .scroll-table {
-            max-height: 500px;
+        /* ── Tables ──────────────────────────────────────────────────── */
+        .table-wrap {
+            overflow-x: auto;
+            max-height: 420px;
             overflow-y: auto;
-            border: 1px solid #e0e0e0;
-            border-radius: 8px;
         }
+        .table-wrap::-webkit-scrollbar { width: 5px; height: 5px; }
+        .table-wrap::-webkit-scrollbar-track { background: transparent; }
+        .table-wrap::-webkit-scrollbar-thumb { background: #cbd5e1; border-radius: 3px; }
+        .table-wrap::-webkit-scrollbar-thumb:hover { background: #94a3b8; }
+
+        table { width: 100%; border-collapse: collapse; font-size: 13px; }
 
-        .scroll-table::-webkit-scrollbar {
-            width: 10px;
+        thead tr { position: sticky; top: 0; z-index: 10; }
+        th {
+            background: #f8fafc;
+            color: var(--text-secondary);
+            font-size: 10.5px;
+            font-weight: 700;
+            text-transform: uppercase;
+            letter-spacing: .7px;
+            padding: 10px 14px;
+            text-align: left;
+            border-bottom: 2px solid var(--border);
+            white-space: nowrap;
+        }
+        td {
+            padding: 10px 14px;
+            border-bottom: 1px solid #f1f5f9;
+            vertical-align: middle;
         }
+        tbody tr:hover td { background: #f8fafc; }
+        tbody tr:last-child td { border-bottom: none; }
 
-        .scroll-table::-webkit-scrollbar-track {
-            background: #f1f1f1;
-            border-radius: 10px;
+        .no-data-row td {
+            text-align: center;
+            padding: 38px 20px;
+            color: var(--text-muted);
+            font-style: italic;
+            font-size: 13px;
+        }
+        .no-data-row code {
+            font-size: 12px;
+            background: #f1f5f9;
+            padding: 1px 6px;
+            border-radius: 4px;
+            color: var(--text-secondary);
+            font-style: normal;
         }
 
-        .scroll-table::-webkit-scrollbar-thumb {
-            background: #667eea;
+        /* ── Chip / badge ────────────────────────────────────────────── */
+        .chip {
+            display: inline-flex;
+            align-items: center;
+            gap: 3px;
+            padding: 2px 8px;
             border-radius: 10px;
+            font-size: 11px;
+            font-weight: 600;
+            white-space: nowrap;
+            vertical-align: middle;
         }
-
-        .scroll-table::-webkit-scrollbar-thumb:hover {
-            background: #764ba2;
+        .chip-ok    { background: #dcfce7; color: #15803d; }
+        .chip-fail  { background: #fee2e2; color: #dc2626; }
+        .chip-muted { background: #f1f5f9; color: #64748b; }
+        .chip-label { background: #ede9fe; color: #6d28d9; }
+        .chip-rel   { background: #ccfbf1; color: #0f766e; }
+        .chip-run   {
+            background: var(--bg);
+            border: 1px solid var(--border);
+            border-radius: 6px;
+            padding: 2px 9px;
+            font-size: 12px;
+            font-weight: 700;
+            font-variant-numeric: tabular-nums;
+            color: var(--text-primary);
         }
 
-        .relation-text {
-            font-style: italic;
-            color: #555;
+        /* ── Monospace ───────────────────────────────────────────────── */
+        .mono {
+            font-family: 'SFMono-Regular', 'Consolas', 'Liberation Mono', monospace;
+            font-size: 11.5px;
+            color: var(--text-secondary);
         }
-
-        .object-label {
-            display: inline-block;
-            background: #e3f2fd;
-            padding: 4px 10px;
-            border-radius: 12px;
-            font-size: 0.9em;
-            font-weight: 500;
-            color: #1976d2;
-            margin: 2px;
+        .ts { font-size: 11px; color: var(--text-muted); white-space: nowrap; }
+
+        /* ── Confidence progress bar ─────────────────────────────────── */
+        .conf-bar { display: flex; align-items: center; gap: 7px; }
+        .conf-track {
+            width: 56px; height: 5px;
+            background: #e2e8f0;
+            border-radius: 3px;
+            overflow: hidden;
+            flex-shrink: 0;
+        }
+        .conf-fill { height: 100%; border-radius: 3px; transition: width .3s ease; }
+        .conf-fill.high { background: var(--ok); }
+        .conf-fill.med  { background: var(--warn); }
+        .conf-fill.low  { background: var(--fail); }
+        .conf-num {
+            font-size: 12px;
+            font-weight: 600;
+            font-variant-numeric: tabular-nums;
+            min-width: 34px;
+        }
+        .conf-num.high { color: #15803d; }
+        .conf-num.med  { color: #92400e; }
+        .conf-num.low  { color: #b91c1c; }
+
+        /* ── Footer ──────────────────────────────────────────────────── */
+        .footer {
+            border-top: 1px solid var(--border);
+            padding: 11px 28px;
+            display: flex;
+            align-items: center;
+            justify-content: space-between;
+            font-size: 11px;
+            color: var(--text-muted);
+            background: var(--surface);
         }
     </style>
 </head>
 <body>
-    <div class="container">
-        <header>
-            <h1>🎯 Vision Benchmark Dashboard</h1>
-            <p class="subtitle">Real-time monitoring of ROS2 Vision Pipeline Services</p>
-        </header>
-
-        <div class="auto-refresh">
-            <div class="indicator"></div>
-            <span>Auto-refreshing every 2 seconds</span>
-            <button onclick="clearData()" style="margin-left: auto;">Clear All Data</button>
+
+<!-- ══════════════════════════════════ SIDEBAR ══════════════════════════════ -->
+<nav id="sidebar">
+    <div class="sb-brand">
+        <div class="sb-brand-title">Vision Pipeline<br>Research Dashboard</div>
+        <div class="sb-brand-sub">ROS 2 · Real-time Monitor</div>
+    </div>
+    <div class="sb-live">
+        <div class="live-dot"></div>
+        Live · 2 s auto-refresh
+    </div>
+
+    <div class="sb-group">Overview</div>
+    <div class="sb-link" onclick="jumpTo('sec-kpi')">
+        <div class="sb-dot" style="background:#64748b"></div>
+        System KPIs
+    </div>
+
+    <div class="sb-group">Run History</div>
+    <div class="sb-link" onclick="jumpTo('sec-runs')">
+        <div class="sb-dot" style="background:var(--color-runs)"></div>
+        Run Summary
+        <span class="sb-count" id="nav-runs">0</span>
+    </div>
+    <div class="sb-link" onclick="jumpTo('sec-objects')">
+        <div class="sb-dot" style="background:var(--color-objects)"></div>
+        Latest Objects
+        <span class="sb-count" id="nav-objects">0</span>
+    </div>
+    <div class="sb-link" onclick="jumpTo('sec-relations')">
+        <div class="sb-dot" style="background:var(--color-relations)"></div>
+        Relations
+        <span class="sb-count" id="nav-relations">0</span>
+    </div>
+
+    <div class="sb-group">Service Monitor</div>
+    <div class="sb-link" onclick="jumpTo('sec-sam')">
+        <div class="sb-dot" style="background:var(--color-sam)"></div>
+        SAM Detection
+        <span class="sb-count" id="nav-sam">0</span>
+    </div>
+    <div class="sb-link" onclick="jumpTo('sec-clip')">
+        <div class="sb-dot" style="background:var(--color-clip)"></div>
+        CLIP Classify
+        <span class="sb-count" id="nav-clip">0</span>
+    </div>
+    <div class="sb-link" onclick="jumpTo('sec-grasp')">
+        <div class="sb-dot" style="background:var(--color-grasp)"></div>
+        GraspNet
+        <span class="sb-count" id="nav-grasp">0</span>
+    </div>
+    <div class="sb-link" onclick="jumpTo('sec-scene')">
+        <div class="sb-dot" style="background:var(--color-scene)"></div>
+        Scene Understanding
+        <span class="sb-count" id="nav-scene">0</span>
+    </div>
+    <div class="sb-link" onclick="jumpTo('sec-pixel')">
+        <div class="sb-dot" style="background:var(--color-pixel)"></div>
+        Pixel → Real
+        <span class="sb-count" id="nav-pixel">0</span>
+    </div>
+</nav>
+
+<!-- ══════════════════════════════════ MAIN ═════════════════════════════════ -->
+<div id="main">
+
+    <!-- Top bar -->
+    <div id="topbar">
+        <div>
+            <div class="topbar-title">Vision Pipeline Research Dashboard</div>
+            <div class="topbar-sub">Segment Anything Model · CLIP · GraspNet · Scene Understanding · ROS 2</div>
         </div>
+        <div class="topbar-right">
+            <div class="refresh-pill">
+                <div class="live-dot"></div>
+                Auto-refresh every 2 s
+            </div>
+            <button class="btn" onclick="clearData()">Clear Session Data</button>
+        </div>
+    </div>
 
-        <div class="stats-bar">
-            <div class="stat-card">
-                <div class="stat-number" id="totalCalls">0</div>
-                <div class="stat-label">Total Service Calls</div>
+    <div class="page-body">
+
+        <!-- ── System KPIs ──────────────────────────────────────────── -->
+        <div id="sec-kpi" class="section-label">System Overview</div>
+        <div class="kpi-grid">
+            <div class="kpi-card" style="--accent:var(--color-runs)">
+                <div class="kpi-value" id="runHistoryCount">0</div>
+                <div class="kpi-label">Stored Runs</div>
+                <div class="kpi-sub">Rolling last 20</div>
+            </div>
+            <div class="kpi-card" style="--accent:var(--color-sam)">
+                <div class="kpi-value" id="samCount">0</div>
+                <div class="kpi-label">SAM Records</div>
             </div>
-            <div class="stat-card">
-                <div class="stat-number" id="pixelCount">0</div>
-                <div class="stat-label">Pixel to Real</div>
+            <div class="kpi-card" style="--accent:var(--color-clip)">
+                <div class="kpi-value" id="clipCount">0</div>
+                <div class="kpi-label">CLIP Records</div>
             </div>
-            <div class="stat-card">
-                <div class="stat-number" id="samCount">0</div>
-                <div class="stat-label">SAM Detections</div>
+            <div class="kpi-card" style="--accent:var(--color-grasp)">
+                <div class="kpi-value" id="graspCount">0</div>
+                <div class="kpi-label">Grasp Records</div>
             </div>
-            <div class="stat-card">
-                <div class="stat-number" id="clipCount">0</div>
-                <div class="stat-label">CLIP Classifications</div>
+            <div class="kpi-card" style="--accent:var(--color-scene)">
+                <div class="kpi-value" id="sceneCount">0</div>
+                <div class="kpi-label">Scene Records</div>
             </div>
-            <div class="stat-card">
-                <div class="stat-number" id="graspCount">0</div>
-                <div class="stat-label">Grasp Detections</div>
+            <div class="kpi-card" style="--accent:var(--color-pixel)">
+                <div class="kpi-value" id="pixelCount">0</div>
+                <div class="kpi-label">Pixel→Real</div>
             </div>
-            <div class="stat-card">
-                <div class="stat-number" id="sceneCount">0</div>
-                <div class="stat-label">Scene Analysis</div>
+            <div class="kpi-card" style="--accent:#64748b">
+                <div class="kpi-value" id="totalCalls">0</div>
+                <div class="kpi-label">Total Svc Calls</div>
+                <div class="kpi-sub">This session</div>
             </div>
         </div>
 
-        <!-- Pixel to Real Section -->
-        <div class="section">
-            <div class="section-header">
-                <h2>📍 Pixel to Real Conversion</h2>
-                <span class="badge" id="pixelBadge">0 Records</span>
+        <!-- ── Run History ──────────────────────────────────────────── -->
+        <div id="sec-runs" class="section-label">Run History · collect_and_export.py</div>
+        <div class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-runs)"></div>
+                <div>
+                    <div class="section-title">Vision Run Summary</div>
+                    <div class="section-subtitle">vision_runs_history.json · newest first · max 20 runs</div>
+                </div>
+                <span class="section-badge" id="runHistoryBadge" style="background:var(--color-runs)">0 Runs</span>
             </div>
-            <div class="scroll-table">
-                <table id="pixelTable">
-                    <thead>
-                        <tr>
-                            <th>Test ID</th>
-                            <th>Timestamp</th>
-                            <th>Input U (px)</th>
-                            <th>Input V (px)</th>
-                            <th>Output X (m)</th>
-                            <th>Output Y (m)</th>
-                            <th>Output Z (m)</th>
-                        </tr>
-                    </thead>
-                    <tbody id="pixelBody">
-                        <tr><td colspan="7" class="no-data">No data available</td></tr>
+            <div class="metric-strip">
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhTotalRuns">—</div>
+                    <div class="metric-lbl">Total Runs</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhLastObjects">—</div>
+                    <div class="metric-lbl">Last Objects</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhLastRelations">—</div>
+                    <div class="metric-lbl">Last Relations</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhLastLatency">—</div>
+                    <div class="metric-lbl">Last Latency</div>
+                </div>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Run</th>
+                        <th>Timestamp</th>
+                        <th>Latency (s)</th>
+                        <th>SAM Detections</th>
+                        <th>SAM Avg Conf</th>
+                        <th>CLIP Filtered</th>
+                        <th>Scene Objects</th>
+                        <th>Relations</th>
+                        <th>Graspable</th>
+                        <th>SAM</th>
+                        <th>CLIP</th>
+                        <th>Scene</th>
+                    </tr></thead>
+                    <tbody id="runHistoryBody">
+                        <tr class="no-data-row"><td colspan="12">No run history yet — run <code>collect_and_export.py</code></td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
+        <!-- ── Latest Objects ───────────────────────────────────────── -->
+        <div id="sec-objects" class="section-label">Latest Run Detail</div>
+        <div class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-objects)"></div>
+                <div>
+                    <div class="section-title">Detected Objects — Latest Run</div>
+                    <div class="section-subtitle">Merged SAM · CLIP · GraspNet per-object data</div>
+                </div>
+                <span class="section-badge" id="latestObjectsBadge" style="background:var(--color-objects)">0 Objects</span>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Object ID</th>
+                        <th>Label</th>
+                        <th>Bounding Box</th>
+                        <th>SAM Confidence</th>
+                        <th>CLIP Confidence</th>
+                        <th>Distance (cm)</th>
+                        <th>IoU</th>
+                        <th>Stable</th>
+                        <th>Has Grasp</th>
+                        <th>Grasp Quality</th>
+                    </tr></thead>
+                    <tbody id="latestObjectsBody">
+                        <tr class="no-data-row"><td colspan="10">No data yet</td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
+        <!-- ── Latest Relations ─────────────────────────────────────── -->
+        <div id="sec-relations" class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-relations)"></div>
+                <div>
+                    <div class="section-title">Spatial Relations — Latest Run</div>
+                    <div class="section-subtitle">Object-level spatial relation graph · Scene Understanding output</div>
+                </div>
+                <span class="section-badge" id="latestRelationsBadge" style="background:var(--color-relations)">0 Relations</span>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Subject</th>
+                        <th>Relation</th>
+                        <th>Target</th>
+                        <th>Confidence</th>
+                        <th>Distance 2D</th>
+                        <th>Description</th>
+                    </tr></thead>
+                    <tbody id="latestRelationsBody">
+                        <tr class="no-data-row"><td colspan="6">No data yet</td></tr>
                     </tbody>
                 </table>
             </div>
         </div>
 
-        <!-- SAM Detections Section -->
-        <div class="section">
-            <div class="section-header">
-                <h2>🎯 SAM Object Detection</h2>
-                <span class="badge" id="samBadge">0 Records</span>
+        <!-- ── SAM ──────────────────────────────────────────────────── -->
+        <div id="sec-sam" class="section-label">Service Monitor</div>
+        <div class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-sam)"></div>
+                <div>
+                    <div class="section-title">SAM — Segment Anything Model</div>
+                    <div class="section-subtitle">/vision/run_pipeline · /vision/detect_objects</div>
+                </div>
+                <span class="section-badge" id="samBadge" style="background:var(--color-sam)">0 Records</span>
             </div>
-            <div class="metric-bar">
-                <div class="metric-item">
-                    <div class="metric-value" id="samAvgIoU">0.00</div>
-                    <div class="metric-label">Avg IoU</div>
+            <div class="metric-strip">
+                <div class="metric-tile">
+                    <div class="metric-val" id="samAvgConf">—</div>
+                    <div class="metric-lbl">Avg Confidence</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="samStableRate">0%</div>
-                    <div class="metric-label">Stability Rate</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="samAvgIoU">—</div>
+                    <div class="metric-lbl">Avg IoU</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="samAvgConf">0.00</div>
-                    <div class="metric-label">Avg Confidence</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="samStableRate">—</div>
+                    <div class="metric-lbl">Stability Rate</div>
                 </div>
             </div>
-            <div class="scroll-table">
-                <table id="samTable">
-                    <thead>
-                        <tr>
-                            <th>Object ID</th>
-                            <th>Bounding Box</th>
-                            <th>Center Point</th>
-                            <th>Confidence</th>
-                            <th>IoU Score</th>
-                            <th>AP (IoU≥0.5)</th>
-                            <th>Distance (cm)</th>
-                            <th>Timestamp</th>
-                        </tr>
-                    </thead>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Object ID</th>
+                        <th>Bounding Box</th>
+                        <th>Center (u, v)</th>
+                        <th>Confidence</th>
+                        <th>IoU Score</th>
+                        <th>AP ≥ 0.5</th>
+                        <th>Distance (cm)</th>
+                        <th>Timestamp</th>
+                    </tr></thead>
                     <tbody id="samBody">
-                        <tr><td colspan="8" class="no-data">No data available</td></tr>
+                        <tr class="no-data-row"><td colspan="8">No SAM data — start <code>/vision/run_pipeline</code></td></tr>
                     </tbody>
                 </table>
             </div>
         </div>
 
-        <!-- CLIP Classifications Section -->
-        <div class="section">
-            <div class="section-header">
-                <h2>🏷️ CLIP Classification</h2>
-                <span class="badge" id="clipBadge">0 Records</span>
+        <!-- ── CLIP ─────────────────────────────────────────────────── -->
+        <div id="sec-clip" class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-clip)"></div>
+                <div>
+                    <div class="section-title">CLIP — Contrastive Language–Image Pre-training</div>
+                    <div class="section-subtitle">/vision/classify_bbox_filtered · /vision/classify_all</div>
+                </div>
+                <span class="section-badge" id="clipBadge" style="background:var(--color-clip)">0 Records</span>
             </div>
-            <div class="metric-bar">
-                <div class="metric-item">
-                    <div class="metric-value" id="clipTop1">N/A</div>
-                    <div class="metric-label">Top-1 Accuracy</div>
+            <div class="metric-strip">
+                <div class="metric-tile">
+                    <div class="metric-val" id="clipTop1">—</div>
+                    <div class="metric-lbl">Top-1 Accuracy</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="clipAvgConf">0.00</div>
-                    <div class="metric-label">Avg Confidence</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="clipAvgConf">—</div>
+                    <div class="metric-lbl">Avg Confidence</div>
                 </div>
             </div>
-            <div class="scroll-table">
-                <table id="clipTable">
-                    <thead>
-                        <tr>
-                            <th>Test ID</th>
-                            <th>Label</th>
-                            <th>Confidence</th>
-                            <th>Top-1 Accuracy</th>
-                            <th>Bounding Box</th>
-                            <th>Timestamp</th>
-                        </tr>
-                    </thead>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Test ID</th>
+                        <th>Label</th>
+                        <th>Confidence</th>
+                        <th>Top-1 Accuracy</th>
+                        <th>Bounding Box</th>
+                        <th>Timestamp</th>
+                    </tr></thead>
                     <tbody id="clipBody">
-                        <tr><td colspan="6" class="no-data">No data available</td></tr>
+                        <tr class="no-data-row"><td colspan="6">No CLIP data — start <code>/vision/classify_bbox_filtered</code></td></tr>
                     </tbody>
                 </table>
             </div>
         </div>
 
-        <!-- GraspNet Section -->
-        <div class="section">
-            <div class="section-header">
-                <h2>🤖 Grasp Detection</h2>
-                <span class="badge" id="graspBadge">0 Records</span>
+        <!-- ── GraspNet ──────────────────────────────────────────────── -->
+        <div id="sec-grasp" class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-grasp)"></div>
+                <div>
+                    <div class="section-title">GraspNet — 6-DoF Grasp Pose Estimation</div>
+                    <div class="section-subtitle">/vision/detect_grasp · /vision/detect_grasp_bbox</div>
+                </div>
+                <span class="section-badge" id="graspBadge" style="background:var(--color-grasp)">0 Records</span>
             </div>
-            <div class="metric-bar">
-                <div class="metric-item">
-                    <div class="metric-value" id="graspAvgQuality">0.00</div>
-                    <div class="metric-label">Avg Quality Score</div>
+            <div class="metric-strip">
+                <div class="metric-tile">
+                    <div class="metric-val" id="graspAvgQuality">—</div>
+                    <div class="metric-lbl">Avg Quality Score</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="graspAvgWidth">0.00m</div>
-                    <div class="metric-label">Avg Grasp Width</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="graspAvgWidth">—</div>
+                    <div class="metric-lbl">Avg Grasp Width</div>
                 </div>
             </div>
-            <div class="scroll-table">
-                <table id="graspTable">
-                    <thead>
-                        <tr>
-                            <th>Test ID</th>
-                            <th>Object ID</th>
-                            <th>Position (u,v)</th>
-                            <th>Position (x,y,z)</th>
-                            <th>Quality Score</th>
-                            <th>Grasp Width</th>
-                            <th>Approach</th>
-                            <th>Timestamp</th>
-                        </tr>
-                    </thead>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Test ID</th>
+                        <th>Object ID</th>
+                        <th>Pixel (u, v)</th>
+                        <th>World (x, y, z) m</th>
+                        <th>Quality Score</th>
+                        <th>Width (m)</th>
+                        <th>Approach</th>
+                        <th>Timestamp</th>
+                    </tr></thead>
                     <tbody id="graspBody">
-                        <tr><td colspan="8" class="no-data">No data available</td></tr>
+                        <tr class="no-data-row"><td colspan="8">No grasp data — start <code>/vision/detect_grasp</code></td></tr>
                     </tbody>
                 </table>
             </div>
         </div>
 
-        <!-- Scene Understanding Section -->
-        <div class="section">
-            <div class="section-header">
-                <h2>🌐 Scene Understanding</h2>
-                <span class="badge" id="sceneBadge">0 Records</span>
+        <!-- ── Scene Understanding ───────────────────────────────────── -->
+        <div id="sec-scene" class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-scene)"></div>
+                <div>
+                    <div class="section-title">Scene Understanding — Holistic Analysis</div>
+                    <div class="section-subtitle">/vision/understand_scene · spatial reasoning + object relations</div>
+                </div>
+                <span class="section-badge" id="sceneBadge" style="background:var(--color-scene)">0 Records</span>
             </div>
-            <div class="metric-bar">
-                <div class="metric-item">
-                    <div class="metric-value" id="sceneObjects">0</div>
-                    <div class="metric-label">Total Objects</div>
+            <div class="metric-strip">
+                <div class="metric-tile">
+                    <div class="metric-val" id="sceneObjects">—</div>
+                    <div class="metric-lbl">Total Objects</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="sceneRelations">0</div>
-                    <div class="metric-label">Relations</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="sceneRelations">—</div>
+                    <div class="metric-lbl">Relations</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="sceneSpatialAcc">0%</div>
-                    <div class="metric-label">Spatial Accuracy</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="sceneSpatialAcc">—</div>
+                    <div class="metric-lbl">Spatial Accuracy</div>
                 </div>
-                <div class="metric-item">
-                    <div class="metric-value" id="sceneAdjacencyAcc">0%</div>
-                    <div class="metric-label">Adjacency Accuracy</div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="sceneAdjacencyAcc">—</div>
+                    <div class="metric-lbl">Adjacency Accuracy</div>
                 </div>
             </div>
-            <div class="scroll-table">
-                <table id="sceneTable">
-                    <thead>
-                        <tr>
-                            <th>Scene ID</th>
-                            <th>Objects</th>
-                            <th>Relations</th>
-                            <th>Description</th>
-                            <th>Spatial Acc</th>
-                            <th>Adjacency Acc</th>
-                            <th>Timestamp</th>
-                        </tr>
-                    </thead>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Scene ID</th>
+                        <th>Objects</th>
+                        <th>Relations</th>
+                        <th>Scene Description</th>
+                        <th>Spatial Acc</th>
+                        <th>Adjacency Acc</th>
+                        <th>Timestamp</th>
+                    </tr></thead>
                     <tbody id="sceneBody">
-                        <tr><td colspan="7" class="no-data">No data available</td></tr>
+                        <tr class="no-data-row"><td colspan="7">No scene data — start <code>/vision/understand_scene</code></td></tr>
                     </tbody>
                 </table>
             </div>
         </div>
+
+        <!-- ── Pixel to Real ────────────────────────────────────────── -->
+        <div id="sec-pixel" class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:var(--color-pixel)"></div>
+                <div>
+                    <div class="section-title">Pixel → Real World Conversion</div>
+                    <div class="section-subtitle">/pixel_to_real · camera-to-world coordinate projection</div>
+                </div>
+                <span class="section-badge" id="pixelBadge" style="background:var(--color-pixel)">0 Records</span>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Test ID</th>
+                        <th>Timestamp</th>
+                        <th>Input U (px)</th>
+                        <th>Input V (px)</th>
+                        <th>Output X (m)</th>
+                        <th>Output Y (m)</th>
+                        <th>Output Z (m)</th>
+                    </tr></thead>
+                    <tbody id="pixelBody">
+                        <tr class="no-data-row"><td colspan="7">No data — call <code>/pixel_to_real</code></td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
+    </div><!-- /page-body -->
+
+    <div class="footer">
+        <span>Vision Pipeline Research Dashboard · ROS 2</span>
+        <span>Last updated: <span id="lastUpdated">—</span></span>
     </div>
+</div><!-- /main -->
+
+<script>
+    // ── Utilities ─────────────────────────────────────────────────────────────
+
+    function confClass(v) {
+        // Map a score to the CSS tier suffix; anything failing both comparisons (incl. NaN) is 'low'.
+        const tier = v >= 0.7 ? 'high' : (v >= 0.4 ? 'med' : 'low');
+        return tier;
+    }
+
+    function confBar(v) {  // 0–1 score → tier-coloured bar plus two-decimal value; non-finite input → dash
+        if (!Number.isFinite(v)) return '<span style="color:var(--text-muted)">—</span>';  // also catches NaN from `x / 100` callers
+        const cls = confClass(v);
+        const pct = Math.max(0, Math.min(100, Math.round(v * 100)));  // clamp both ends for the CSS width
+        return `<div class="conf-bar">
+            <div class="conf-track"><div class="conf-fill ${cls}" style="width:${pct}%"></div></div>
+            <span class="conf-num ${cls}">${v.toFixed(2)}</span>
+        </div>`;
+    }
+
+    function chipOk(val) {
+        // Pass/Fail chip: any truthy value is rendered as a pass.
+        if (val) return '<span class="chip chip-ok">&#10003; Pass</span>';
+        return '<span class="chip chip-fail">&#10007; Fail</span>';
+    }
+
+    function chipSvc(val) {
+        // Icon-only variant of the pass/fail chip: tick for truthy, cross otherwise.
+        if (val) return '<span class="chip chip-ok">&#10003;</span>';
+        return '<span class="chip chip-fail">&#10007;</span>';
+    }
+
+    function tsShort(t) {
+        const when = t ? new Date(t) : null;  // falsy or unparseable input renders as a dash, never "Invalid Date"
+        return `<span class="ts">${when && !Number.isNaN(when.getTime()) ? when.toLocaleTimeString() : '—'}</span>`;
+    }
+
+    function setNav(id, count) {
+        const badge = document.getElementById(id);  // silently skip ids that are not in the page
+        if (badge !== null) badge.textContent = count;
+    }
+
+    function jumpTo(id) {
+        // Smooth-scroll to the element with this id (aligned to its start); unknown ids are ignored.
+        document.getElementById(id)?.scrollIntoView({ behavior: 'smooth', block: 'start' });
+    }
+
+    function formatAccuracy(val) {
+        // null/undefined render as a muted N/A; otherwise truthiness picks the True/False chip.
+        if (val == null) return '<span style="color:var(--text-muted)">N/A</span>';
+        if (val) return '<span class="chip chip-ok">&#10003; True</span>';
+        return '<span class="chip chip-fail">&#10007; False</span>';
+    }
+
+    // ── /api/data ─────────────────────────────────────────────────────────────
+    let lastData = null;
+
+    async function fetchData() {
+        // Pull /api/data, remember the payload in lastData and re-render the dashboard from it.
+        try {
+            const res = await fetch('/api/data');
+            if (!res.ok) throw new Error(`HTTP ${res.status}`);  // never parse or cache an error response
+            lastData = await res.json();
+            updateDashboard(lastData);
+        } catch (e) { console.warn('Error fetching /api/data:', e); }  // logged only; nothing is rethrown
+    }
+
+    function updateDashboard(data) {
+        const show = (id, value) => { document.getElementById(id).textContent = value; };
+        const pixel = data.pixel_to_real, sam = data.sam_detections, clip = data.clip_classifications;
+        const grasp = data.grasp_detections, scene = data.scene_understanding;
+        // Summary counters.
+        show('totalCalls', data.metadata.total_calls);
+        show('pixelCount', pixel.length);
+        show('samCount',   sam.length);
+        show('clipCount',  clip.length);
+        show('graspCount', grasp.length);
+        show('sceneCount', scene.length);
+        // Navigation counters, then each section's own renderer.
+        [['nav-sam', sam], ['nav-clip', clip], ['nav-grasp', grasp], ['nav-scene', scene], ['nav-pixel', pixel]]
+            .forEach(([navId, rows]) => setNav(navId, rows.length));
+        updatePixelToReal(pixel);
+        updateSAMDetections(sam);
+        updateCLIPClassifications(clip);
+        updateGraspDetections(grasp);
+        updateSceneUnderstanding(scene);
+        show('lastUpdated', new Date().toLocaleTimeString());
+    }
+
+    // ── Pixel to Real ─────────────────────────────────────────────────────────
+    function updatePixelToReal(records) {
+        document.getElementById('pixelBadge').textContent = `${records.length} Records`;
+        const tbody = document.getElementById('pixelBody');
+        const emptyRow = '<tr class="no-data-row"><td colspan="7">No data — call <code>/pixel_to_real</code></td></tr>';
+        // One row per record: test id, time, input (u, v) and output (x, y, z) to four decimals.
+        const toRow = rec => `<tr>
+            <td class="mono">${rec.test_id}</td>
+            <td>${tsShort(rec.timestamp)}</td>
+            <td class="mono">${rec.input.u}</td>
+            <td class="mono">${rec.input.v}</td>
+            <td class="mono">${rec.output.x.toFixed(4)}</td>
+            <td class="mono">${rec.output.y.toFixed(4)}</td>
+            <td class="mono">${rec.output.z.toFixed(4)}</td>
+        </tr>`;
+        // Newest first, limited to the last 50 records; placeholder row when there are none.
+        tbody.innerHTML = records.length ? records.slice(-50).reverse().map(rec => toRow(rec)).join('') : emptyRow;
+    }
+
+    // ── SAM Detections ────────────────────────────────────────────────────────
+    function updateSAMDetections(records) {
+        const total = records.length;
+        document.getElementById('samBadge').textContent = `${total} Records`;
+        const tbody = document.getElementById('samBody');
+        const setMetric = (id, text) => { document.getElementById(id).textContent = text; };
+        if (!total) {
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="8">No SAM data — start <code>/vision/run_pipeline</code></td></tr>';
+            for (const id of ['samAvgConf', 'samAvgIoU', 'samStableRate']) setMetric(id, '—');
+            return;
+        }
+        // Means and the stable rate cover every record, not just the 50 rows rendered below.
+        const mean = key => records.reduce((sum, rec) => sum + rec[key], 0) / total;
+        const stableCount = records.filter(rec => rec.is_stable).length;
+        setMetric('samAvgConf', mean('confidence').toFixed(3));
+        setMetric('samAvgIoU', mean('iou_score').toFixed(3));
+        setMetric('samStableRate', `${(stableCount / total * 100).toFixed(0)}%`);
+
+        tbody.innerHTML = records.slice(-50).reverse().map(rec => `<tr>
+            <td class="mono">${rec.obj_id}</td>
+            <td class="mono" style="font-size:11px">(${rec.bbox.x1},${rec.bbox.y1})→(${rec.bbox.x2},${rec.bbox.y2})</td>
+            <td class="mono">(${rec.center.u}, ${rec.center.v})</td>
+            <td>${confBar(rec.confidence)}</td>
+            <td>${confBar(rec.iou_score)}</td>
+            <td>${chipOk(rec.is_stable)}</td>
+            <td class="mono">${rec.distance_cm.toFixed(1)}</td>
+            <td>${tsShort(rec.timestamp)}</td>
+        </tr>`).join('');
+    }
+
+    // ── CLIP Classifications ──────────────────────────────────────────────────
+    function updateCLIPClassifications(records) {  // Refresh the CLIP badge, metric tiles and table.
+        document.getElementById('clipBadge').textContent = `${records.length} Records`;
+        const tbody = document.getElementById('clipBody');
+        if (!records.length) {
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="6">No CLIP data — start <code>/vision/classify_bbox_filtered</code></td></tr>';
+            ['clipTop1','clipAvgConf'].forEach(id => document.getElementById(id).textContent = '—');
+            return;
+        }
+        const withAcc = records.filter(r => r.top1_accuracy != null);  // skip null AND undefined, as formatAccuracy does
+        const top1Acc = withAcc.length
+            ? (withAcc.filter(r => r.top1_accuracy).length / withAcc.length * 100).toFixed(1) + '%'
+            : 'N/A';
+        const avgConf = records.reduce((s, r) => s + r.confidence, 0) / records.length;
+        // Tiles summarise every record; Top-1 uses only the records that carry a verdict.
+        document.getElementById('clipTop1').textContent   = top1Acc;
+        document.getElementById('clipAvgConf').textContent = avgConf.toFixed(3);
+        // Table: newest first, limited to the last 50 records.
+        tbody.innerHTML = records.slice(-50).reverse().map(r => `<tr>
+            <td class="mono">${r.test_id}</td>
+            <td><span class="chip chip-label">${r.label}</span></td>
+            <td>${confBar(r.confidence)}</td>
+            <td>${formatAccuracy(r.top1_accuracy)}</td>
+            <td class="mono" style="font-size:11px">${JSON.stringify(r.bbox)}</td>
+            <td>${tsShort(r.timestamp)}</td>
+        </tr>`).join('');
+    }
+
+    // ── Grasp Detections ──────────────────────────────────────────────────────
+    function updateGraspDetections(records) {
+        const total = records.length;
+        document.getElementById('graspBadge').textContent = `${total} Records`;
+        const tbody = document.getElementById('graspBody');
+        const setMetric = (id, text) => { document.getElementById(id).textContent = text; };
+        if (!total) {
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="8">No grasp data — start <code>/vision/detect_grasp</code></td></tr>';
+            for (const id of ['graspAvgQuality', 'graspAvgWidth']) setMetric(id, '—');
+            return;
+        }
+        const mean = key => records.reduce((sum, rec) => sum + rec[key], 0) / total;
+        setMetric('graspAvgQuality', mean('quality_score').toFixed(3));
+        setMetric('graspAvgWidth', mean('grasp_width').toFixed(3) + ' m');
+        // Tiles above average every record; the table lists the last 50, newest first.
+        tbody.innerHTML = records.slice(-50).reverse().map(rec => `<tr>
+            <td class="mono">${rec.test_id}</td>
+            <td class="mono">${rec.object_id}</td>
+            <td class="mono">(${rec.pixel_position.u}, ${rec.pixel_position.v})</td>
+            <td class="mono">(${rec.world_position.x.toFixed(3)}, ${rec.world_position.y.toFixed(3)}, ${rec.world_position.z.toFixed(3)})</td>
+            <td>${confBar(rec.quality_score)}</td>
+            <td class="mono">${rec.grasp_width.toFixed(3)}</td>
+            <td><span class="chip chip-muted">${rec.approach_direction}</span></td>
+            <td>${tsShort(rec.timestamp)}</td>
+        </tr>`).join('');
+    }
+
+    // ── Scene Understanding ───────────────────────────────────────────────────
+    function updateSceneUnderstanding(records) {  // Refresh the scene badge, the four metric tiles and the scene table.
+        document.getElementById('sceneBadge').textContent = `${records.length} Records`;
+        const tbody = document.getElementById('sceneBody');
+        if (!records.length) {  // no records: placeholder row and dashes in every tile
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="7">No scene data — start <code>/vision/understand_scene</code></td></tr>';
+            ['sceneObjects','sceneRelations','sceneSpatialAcc','sceneAdjacencyAcc'].forEach(id =>
+                document.getElementById(id).textContent = '—');
+            return;
+        }
+        const latest = records[records.length - 1];  // tiles reflect only the last record in the array
+        document.getElementById('sceneObjects').textContent     = latest.total_objects;
+        document.getElementById('sceneRelations').textContent   = latest.relations.length;
+        document.getElementById('sceneSpatialAcc').textContent  = latest.spatial_accuracy.toFixed(0) + '%';
+        document.getElementById('sceneAdjacencyAcc').textContent= latest.adjacency_accuracy.toFixed(0) + '%';
+        // Table: last 20 records, reversed. Accuracies are divided by 100 for confBar (assumes 0–100 values — TODO confirm).
+        tbody.innerHTML = records.slice(-20).reverse().map(r => `<tr>
+            <td class="mono">${r.scene_id}</td>
+            <td>${r.object_labels.map(l => `<span class="chip chip-label">${l}</span>`).join(' ')}</td>
+            <td>
+                <div style="max-height:80px;overflow-y:auto;display:flex;flex-wrap:wrap;gap:2px;padding:2px 0">
+                    ${r.relations.map(rel =>
+                        `<span class="chip chip-rel">${rel.subject} <em>${rel.relation}</em> ${rel.object} · ${(rel.confidence*100).toFixed(0)}%</span>`
+                    ).join('')}
+                </div>
+            </td>
+            <td style="max-width:240px;font-size:12px;color:var(--text-secondary)">${r.scene_description}</td>
+            <td>${confBar(r.spatial_accuracy / 100)}</td>
+            <td>${confBar(r.adjacency_accuracy / 100)}</td>
+            <td>${tsShort(r.timestamp)}</td>
+        </tr>`).join('');
+    }
+
+    // ── /api/run-history ──────────────────────────────────────────────────────
+    async function fetchRunHistory() {
+        // Pull /api/run-history and hand the parsed array to updateRunHistory.
+        try {
+            const res  = await fetch('/api/run-history');
+            if (!res.ok) throw new Error(`HTTP ${res.status}`);  // an error body is not a run list
+            const runs = await res.json();
+            updateRunHistory(runs);
+        } catch (e) { console.warn('Run history unavailable:', e); }  // logged only; nothing is rethrown
+    }
+
+    function updateRunHistory(runs) {
+        document.getElementById('runHistoryBadge').textContent = `${runs.length} Runs`;
+        document.getElementById('rhTotalRuns').textContent     = runs.length;
+        document.getElementById('runHistoryCount').textContent = runs.length;
+        setNav('nav-runs', runs.length);
+
+        const tbody    = document.getElementById('runHistoryBody');
+        const objBody  = document.getElementById('latestObjectsBody');
+        const relBody  = document.getElementById('latestRelationsBody');
+
+        const noRuns = '<tr class="no-data-row"><td colspan="12">No run history yet — run <code>collect_and_export.py</code></td></tr>';
+        const noObj  = '<tr class="no-data-row"><td colspan="10">No data yet</td></tr>';
+        const noRel  = '<tr class="no-data-row"><td colspan="6">No data yet</td></tr>';
+
+        if (!runs.length) {
+            tbody.innerHTML   = noRuns;
+            objBody.innerHTML = noObj;
+            relBody.innerHTML = noRel;
+            document.getElementById('latestObjectsBadge').textContent   = '0 Objects';
+            document.getElementById('latestRelationsBadge').textContent = '0 Relations';
+            ['rhLastObjects','rhLastRelations','rhLastLatency'].forEach(id =>
+                document.getElementById(id).textContent = '—');
+            setNav('nav-objects', 0);
+            setNav('nav-relations', 0);
+            return;
+        }
 
-    <script>
-        let lastData = null;
-
-        async function fetchData() {
-            try {
-                const response = await fetch('/api/data');
-                const data = await response.json();
-                lastData = data;
-                updateDashboard(data);
-            } catch (error) {
-                console.error('Error fetching data:', error);
-            }
-        }
-
-        function updateDashboard(data) {
-            // Update stats
-            document.getElementById('totalCalls').textContent = data.metadata.total_calls;
-            document.getElementById('pixelCount').textContent = data.pixel_to_real.length;
-            document.getElementById('samCount').textContent = data.sam_detections.length;
-            document.getElementById('clipCount').textContent = data.clip_classifications.length;
-            document.getElementById('graspCount').textContent = data.grasp_detections.length;
-            document.getElementById('sceneCount').textContent = data.scene_understanding.length;
-
-            // Update Pixel to Real
-            updatePixelToReal(data.pixel_to_real);
-
-            // Update SAM Detections
-            updateSAMDetections(data.sam_detections);
-
-            // Update CLIP Classifications
-            updateCLIPClassifications(data.clip_classifications);
-
-            // Update Grasp Detections
-            updateGraspDetections(data.grasp_detections);
-
-            // Update Scene Understanding
-            updateSceneUnderstanding(data.scene_understanding);
-        }
-
-        function updatePixelToReal(records) {
-            document.getElementById('pixelBadge').textContent = `${records.length} Records`;
-            const tbody = document.getElementById('pixelBody');
-            
-            if (records.length === 0) {
-                tbody.innerHTML = '<tr><td colspan="7" class="no-data">No data available</td></tr>';
-                return;
-            }
-
-            tbody.innerHTML = records.slice(-50).reverse().map(record => `
-                <tr>
-                    <td>${record.test_id}</td>
-                    <td class="timestamp">${formatTimestamp(record.timestamp)}</td>
-                    <td>${record.input.u}</td>
-                    <td>${record.input.v}</td>
-                    <td>${record.output.x.toFixed(3)}</td>
-                    <td>${record.output.y.toFixed(3)}</td>
-                    <td>${record.output.z.toFixed(3)}</td>
-                </tr>
-            `).join('');
-        }
-
-        function updateSAMDetections(records) {
-            document.getElementById('samBadge').textContent = `${records.length} Records`;
-            const tbody = document.getElementById('samBody');
-            
-            if (records.length === 0) {
-                tbody.innerHTML = '<tr><td colspan="8" class="no-data">No data available</td></tr>';
-                document.getElementById('samAvgIoU').textContent = '0.00';
-                document.getElementById('samStableRate').textContent = '0%';
-                document.getElementById('samAvgConf').textContent = '0.00';
-                return;
-            }
-
-            // Calculate metrics
-            const avgIoU = records.reduce((sum, r) => sum + r.iou_score, 0) / records.length;
-            const stableCount = records.filter(r => r.is_stable).length;
-            const stableRate = (stableCount / records.length * 100).toFixed(0);
-            const avgConf = records.reduce((sum, r) => sum + r.confidence, 0) / records.length;
-
-            document.getElementById('samAvgIoU').textContent = avgIoU.toFixed(2);
-            document.getElementById('samStableRate').textContent = `${stableRate}%`;
-            document.getElementById('samAvgConf').textContent = avgConf.toFixed(2);
-
-            tbody.innerHTML = records.slice(-50).reverse().map(record => `
-                <tr>
-                    <td>${record.obj_id}</td>
-                    <td class="bbox-coords">(${record.bbox.x1}, ${record.bbox.y1}, ${record.bbox.x2}, ${record.bbox.y2})</td>
-                    <td class="bbox-coords">(${record.center.u}, ${record.center.v})</td>
-                    <td class="${getConfidenceClass(record.confidence)}">${record.confidence.toFixed(2)}</td>
-                    <td class="${getConfidenceClass(record.iou_score)}">${record.iou_score.toFixed(2)}</td>
-                    <td class="${record.is_stable ? 'success' : 'failure'}">${record.is_stable ? '✓ Pass' : '✗ Fail'}</td>
-                    <td>${record.distance_cm.toFixed(1)}</td>
-                    <td class="timestamp">${formatTimestamp(record.timestamp)}</td>
-                </tr>
-            `).join('');
-        }
-
-        function updateCLIPClassifications(records) {
-            document.getElementById('clipBadge').textContent = `${records.length} Records`;
-            const tbody = document.getElementById('clipBody');
-            
-            if (records.length === 0) {
-                tbody.innerHTML = '<tr><td colspan="6" class="no-data">No data available</td></tr>';
-                document.getElementById('clipTop1').textContent = 'N/A';
-                document.getElementById('clipAvgConf').textContent = '0.00';
-                return;
-            }
-
-            // Calculate metrics
-            const withAccuracy = records.filter(r => r.top1_accuracy !== null);
-            const correctCount = withAccuracy.filter(r => r.top1_accuracy === true).length;
-            const top1Acc = withAccuracy.length > 0 ? (correctCount / withAccuracy.length * 100).toFixed(1) + '%' : 'N/A';
-            const avgConf = records.reduce((sum, r) => sum + r.confidence, 0) / records.length;
-
-            document.getElementById('clipTop1').textContent = top1Acc;
-            document.getElementById('clipAvgConf').textContent = avgConf.toFixed(2);
-
-            tbody.innerHTML = records.slice(-50).reverse().map(record => `
-                <tr>
-                    <td>${record.test_id}</td>
-                    <td><span class="object-label">${record.label}</span></td>
-                    <td class="${getConfidenceClass(record.confidence)}">${record.confidence.toFixed(2)}</td>
-                    <td>${formatAccuracy(record.top1_accuracy)}</td>
-                    <td class="bbox-coords">${JSON.stringify(record.bbox)}</td>
-                    <td class="timestamp">${formatTimestamp(record.timestamp)}</td>
-                </tr>
-            `).join('');
-        }
-
-        function updateGraspDetections(records) {
-            document.getElementById('graspBadge').textContent = `${records.length} Records`;
-            const tbody = document.getElementById('graspBody');
-            
-            if (records.length === 0) {
-                tbody.innerHTML = '<tr><td colspan="8" class="no-data">No data available</td></tr>';
-                document.getElementById('graspAvgQuality').textContent = '0.00';
-                document.getElementById('graspAvgWidth').textContent = '0.00m';
-                return;
-            }
-
-            // Calculate metrics
-            const avgQuality = records.reduce((sum, r) => sum + r.quality_score, 0) / records.length;
-            const avgWidth = records.reduce((sum, r) => sum + r.grasp_width, 0) / records.length;
-
-            document.getElementById('graspAvgQuality').textContent = avgQuality.toFixed(2);
-            document.getElementById('graspAvgWidth').textContent = avgWidth.toFixed(3) + 'm';
-
-            tbody.innerHTML = records.slice(-50).reverse().map(record => `
-                <tr>
-                    <td>${record.test_id}</td>
-                    <td>${record.object_id}</td>
-                    <td class="bbox-coords">(${record.pixel_position.u}, ${record.pixel_position.v})</td>
-                    <td class="bbox-coords">(${record.world_position.x.toFixed(3)}, ${record.world_position.y.toFixed(3)}, ${record.world_position.z.toFixed(3)})</td>
-                    <td class="${getConfidenceClass(record.quality_score)}">${record.quality_score.toFixed(2)}</td>
-                    <td>${record.grasp_width.toFixed(3)}m</td>
-                    <td>${record.approach_direction}</td>
-                    <td class="timestamp">${formatTimestamp(record.timestamp)}</td>
-                </tr>
-            `).join('');
-        }
-
-        function updateSceneUnderstanding(records) {
-            document.getElementById('sceneBadge').textContent = `${records.length} Records`;
-            const tbody = document.getElementById('sceneBody');
-            
-            if (records.length === 0) {
-                tbody.innerHTML = '<tr><td colspan="7" class="no-data">No data available</td></tr>';
-                document.getElementById('sceneObjects').textContent = '0';
-                document.getElementById('sceneRelations').textContent = '0';
-                document.getElementById('sceneSpatialAcc').textContent = '0%';
-                document.getElementById('sceneAdjacencyAcc').textContent = '0%';
-                return;
-            }
-
-            // Get latest scene metrics
-            const latest = records[records.length - 1];
-            document.getElementById('sceneObjects').textContent = latest.total_objects;
-            document.getElementById('sceneRelations').textContent = latest.relations.length;
-            document.getElementById('sceneSpatialAcc').textContent = latest.spatial_accuracy.toFixed(0) + '%';
-            document.getElementById('sceneAdjacencyAcc').textContent = latest.adjacency_accuracy.toFixed(0) + '%';
-
-            tbody.innerHTML = records.slice(-20).reverse().map(record => `
-                <tr>
-                    <td>${record.scene_id}</td>
-                    <td>${record.object_labels.map(l => `<span class="object-label">${l}</span>`).join(' ')}</td>
-                    <td>
-                        <div style="max-height: 100px; overflow-y: auto; font-size: 0.85em;">
-                            ${record.relations.map(r => 
-                                `<div class="relation-text">${r.subject} ${r.relation} ${r.object} (${(r.confidence * 100).toFixed(0)}%)</div>`
-                            ).join('')}
-                        </div>
-                    </td>
-                    <td style="max-width: 300px; font-size: 0.85em;">${record.scene_description}</td>
-                    <td class="${getConfidenceClass(record.spatial_accuracy / 100)}">${record.spatial_accuracy.toFixed(0)}%</td>
-                    <td class="${getConfidenceClass(record.adjacency_accuracy / 100)}">${record.adjacency_accuracy.toFixed(0)}%</td>
-                    <td class="timestamp">${formatTimestamp(record.timestamp)}</td>
-                </tr>
-            `).join('');
-        }
-
-        function getConfidenceClass(value) {
-            if (value >= 0.7) return 'confidence-high';
-            if (value >= 0.4) return 'confidence-medium';
-            return 'confidence-low';
-        }
-
-        function formatAccuracy(value) {
-            if (value === null) return '<span style="color: #999;">N/A</span>';
-            if (value === true) return '<span class="success">✓ True</span>';
-            return '<span class="failure">✗ False</span>';
-        }
-
-        function formatTimestamp(timestamp) {
-            const date = new Date(timestamp);
-            return date.toLocaleTimeString();
-        }
-
-        async function clearData() {
-            if (confirm('Are you sure you want to clear all benchmark data?')) {
-                // This would require a service call - for now just notify user
-                alert('To clear data, run: ros2 service call /benchmark/clear_data std_srvs/srv/Trigger');
-            }
-        }
-
-        // Auto-refresh every 2 seconds
-        setInterval(fetchData, 2000);
-        
-        // Initial fetch
-        fetchData();
-    </script>
+        const latest = runs[runs.length - 1];
+        document.getElementById('rhLastObjects').textContent  = latest.scene?.total_objects  ?? '—';
+        document.getElementById('rhLastRelations').textContent= latest.scene?.total_relations ?? '—';
+        document.getElementById('rhLastLatency').textContent  =
+            latest.meta?.latency_s != null ? latest.meta.latency_s.toFixed(2) + ' s' : '—';
+
+        // Run history table
+        tbody.innerHTML = runs.slice().reverse().map(run => {
+            const meta  = run.meta  || {};
+            const sam   = run.sam   || {};
+            const clip  = run.clip  || {};
+            const scene = run.scene || {};
+            const t = meta.timestamp ? new Date(meta.timestamp).toLocaleString() : '—';
+            return `<tr>
+                <td><span class="chip chip-run">#${meta.run_no ?? '?'}</span></td>
+                <td class="ts">${t}</td>
+                <td class="mono">${meta.latency_s != null ? meta.latency_s.toFixed(2) : '—'}</td>
+                <td class="mono">${sam.total_detections ?? '—'}</td>
+                <td>${sam.avg_confidence != null ? confBar(sam.avg_confidence) : '—'}</td>
+                <td class="mono">${clip.filtered_regions ?? '—'}</td>
+                <td class="mono">${scene.total_objects   ?? '—'}</td>
+                <td class="mono">${scene.total_relations ?? '—'}</td>
+                <td class="mono">${scene.graspable_objects ?? '—'}</td>
+                <td>${chipSvc(sam.success)}</td>
+                <td>${chipSvc(clip.success)}</td>
+                <td>${chipSvc(scene.success)}</td>
+            </tr>`;
+        }).join('');
+
+        // Latest objects
+        const objects = latest.objects || [];
+        document.getElementById('latestObjectsBadge').textContent = `${objects.length} Objects`;
+        setNav('nav-objects', objects.length);
+        objBody.innerHTML = objects.length ? objects.map(obj => `<tr>
+            <td class="mono">${obj.object_id ?? '—'}</td>
+            <td><span class="chip chip-label">${obj.label ?? 'unknown'}</span></td>
+            <td class="mono" style="font-size:11px">(${obj.bbox_x1??0},${obj.bbox_y1??0})→(${obj.bbox_x2??0},${obj.bbox_y2??0})</td>
+            <td>${confBar(obj.sam_confidence)}</td>
+            <td>${confBar(obj.clip_confidence)}</td>
+            <td class="mono">${obj.distance_cm != null ? obj.distance_cm.toFixed(1) : '—'}</td>
+            <td class="mono">${obj.iou_score   != null ? obj.iou_score.toFixed(3)   : '—'}</td>
+            <td>${chipOk(obj.is_stable)}</td>
+            <td>${chipOk(obj.has_grasp)}</td>
+            <td>${obj.grasp ? confBar(obj.grasp.quality_score) : '<span style="color:var(--text-muted)">—</span>'}</td>
+        </tr>`).join('') : noObj;
+
+        // Latest relations
+        const relations = latest.relations || [];
+        document.getElementById('latestRelationsBadge').textContent = `${relations.length} Relations`;
+        setNav('nav-relations', relations.length);
+        relBody.innerHTML = relations.length ? relations.map(rel => `<tr>
+            <td><span class="chip chip-label">${rel.subject ?? ''}</span></td>
+            <td><span class="chip chip-rel">${rel.relation ?? ''}</span></td>
+            <td><span class="chip chip-label">${rel.target_object ?? ''}</span></td>
+            <td>${confBar(rel.confidence)}</td>
+            <td class="mono">${rel.distance_2d != null ? rel.distance_2d.toFixed(1) : '—'}</td>
+            <td style="font-size:12px;color:var(--text-secondary)">${rel.description ?? ''}</td>
+        </tr>`).join('') : noRel;
+    }
+
+    // ── Clear data (legacy) ───────────────────────────────────────────────────
+    async function clearData() {
+        if (confirm('Clear all in-session benchmark data?')) {
+            alert('Run:\nros2 service call /benchmark/clear_data std_srvs/srv/Trigger');
+        }
+    }
+
+    // ── Polling ───────────────────────────────────────────────────────────────
+    setInterval(fetchData,       2000);
+    setInterval(fetchRunHistory, 2000);
+    fetchData();
+    fetchRunHistory();
+</script>
 </body>
 </html>
diff --git a/docs/COLLECT_AND_EXPORT.md b/docs/COLLECT_AND_EXPORT.md
new file mode 100644
index 0000000..beb6287
--- /dev/null
+++ b/docs/COLLECT_AND_EXPORT.md
@@ -0,0 +1,264 @@
+# Vision Data Collector & Excel Exporter
+
+Runs the full SAM → CLIP → Scene Understanding pipeline **once**, stores the result in a rolling
+JSON history (last 20 runs), and writes a ready-to-open Excel workbook.
+
+---
+
+## Output Files
+
+| File | Location | Description |
+|---|---|---|
+| `vision_runs_history.json` | `vision/` package root (next to `README.md`) | Rolling database of last 20 runs |
+| `vision_runs_export.xlsx` | `vision/` package root | Excel workbook, 4 sheets |
+
+### Excel Sheets
+
+| Sheet | One row per | Key columns |
+|---|---|---|
+| **Runs** | Each script invocation | timestamp, total objects, graspable, avg confidence, stability %, scene description, latency |
+| **Objects** | Each detected object | CLIP label, bbox coords, SAM + CLIP confidence, distance cm, IoU score, grasp quality |
+| **Relations** | Each spatial relation | subject → relation → target, confidence, 2D distance |
+| **Grasps** | Each grasp pose | x/y/z position (m), quality score, gripper width (m) |
+
+---
+
+## Prerequisites
+
+### 1. Install openpyxl (one-time)
+
+```bash
+pip install openpyxl
+```
+
+### 2. ROS2 workspace must be built
+
+```bash
+cd ~/ros2_ws   # or wherever your workspace is
+colcon build --packages-select vision
+source install/setup.bash
+```
+
+---
+
+## How to Run
+
+### Step 1 — Start the vision nodes (separate terminals)
+
+```bash
+# Terminal 1: SAM detector (required)
+ros2 run vision simple_sam_detector
+
+# Terminal 2: CLIP classifier (required for object labels)
+ros2 run vision clip_classifier
+
+# Terminal 3: Scene understanding (required for relations + grasp data)
+ros2 run vision scene_understanding
+
+# Terminal 4: GraspNet detector (optional — needed for grasp positions)
+ros2 run vision graspnet_detector
+```
+
+Wait until you see the nodes announce their services in the terminal output before continuing.
+
+### Step 2 — Make sure a camera is publishing
+
+```bash
+# Simulation (Gazebo):
+ros2 launch ur_yt_sim spawn_ur5_camera_gripper_moveit.launch.py
+
+# Real RealSense camera:
+ros2 launch realsense2_camera rs_launch.py
+
+# Static image (for testing without hardware):
+ros2 launch vision vision_with_camera.launch.py camera_type:=file image_file:=path/to/image.jpg
+```
+
+### Step 3 — Run the collector
+
+```bash
+# Option A: directly with python3
+python3 vision_scripts/collect_and_export.py
+
+# Option B: as a ROS2 entry point (after colcon build)
+ros2 run vision collect_and_export
+```
+
+### Expected terminal output
+
+```
+============================================================
+  Vision Pipeline Data Collector & Excel Exporter
+============================================================
+  History file : /path/to/vision/vision_runs_history.json
+  Excel file   : /path/to/vision/vision_runs_export.xlsx
+  Max runs kept: 20
+============================================================
+Waiting for /vision/run_pipeline ...
+RUN #1 — Step 1: SAM /vision/run_pipeline
+  SAM: 3 objects detected
+RUN #1 — Step 2: CLIP /vision/classify_bbox_filtered
+  CLIP: 2 regions classified
+RUN #1 — Step 3: Scene /vision/understand_scene
+  Scene: 3 objects, 4 relations
+RUN #1 complete in 2.341s — 3 objects, 4 relations
+============================================================
+[OK] History saved → .../vision_runs_history.json  (1 runs stored)
+[OK] Excel exported → .../vision_runs_export.xlsx
+
+Done. Open vision_runs_export.xlsx to view results.
+```
+
+---
+
+## Run it multiple times
+
+Each time you run the script it **appends** one new entry to the JSON and **overwrites** the Excel.
+After 20 runs the oldest entry is automatically dropped.
+
+```bash
+# Run 5 times in a loop (bash)
+for i in {1..5}; do
+    python3 vision_scripts/collect_and_export.py
+    sleep 2
+done
+```
+
+---
+
+## Debugging
+
+### Problem: "service not available — skipping"
+
+The script skips any service that does not become available within 5 seconds and
+continues with the remaining services without crashing.
+
+**Fix:** Check that the required node is running:
+
+```bash
+ros2 node list           # should show /simple_sam_detector, /clip_classifier, etc.
+ros2 service list        # should show /vision/run_pipeline, /vision/classify_bbox_filtered, etc.
+```
+
+If a node is missing, start it (see Step 1 above).
+
+---
+
+### Problem: No camera image / SAM returns 0 objects
+
+```bash
+# Check camera topics are publishing
+ros2 topic list | grep camera
+ros2 topic hz /camera/image_raw       # should show ~30 Hz
+
+# Check SAM subscriber got a frame
+ros2 topic echo /vision/status        # shows uptime and detection count
+```
+
+SAM only detects when a frame has been received. Wait a second after starting the camera before calling the collector.
+
+---
+
+### Problem: CLIP returns "No classified regions"
+
+CLIP auto-classifies when it receives a message on `/vision/sam_detections`.
+The collector calls `/vision/run_pipeline` first (which publishes to that topic), then
+waits 500 ms before calling CLIP. If CLIP is slow on its first run (model loading), warm it up first:
+
+```bash
+# Call run_pipeline manually first to warm up CLIP
+ros2 service call /vision/run_pipeline std_srvs/srv/Trigger
+
+# Wait a few seconds, then run the collector
+python3 vision_scripts/collect_and_export.py
+```
+
+---
+
+### Problem: Scene understanding times out
+
+Scene understanding calls `/vision/detect_objects` internally which can take a few
+seconds. The collector allows **15 seconds** for it. If it still times out:
+
+```bash
+# Test scene understanding manually
+ros2 service call /vision/understand_scene std_srvs/srv/Trigger
+```
+
+If that also hangs, check that `simple_sam_detector` is running (scene understanding
+calls it internally).
+
+---
+
+### Problem: "openpyxl not installed"
+
+```bash
+pip install openpyxl
+
+# Verify:
+python3 -c "import openpyxl; print(openpyxl.__version__)"
+```
+
+The script will still save `vision_runs_history.json` even without openpyxl — only
+the Excel export is skipped.
+
+---
+
+### Problem: Excel file is open in Excel and the script fails to overwrite it
+
+Close the Excel file first, then re-run the collector.
+
+---
+
+### Inspect the raw JSON history
+
+```bash
+# Pretty-print the history file
+python3 -c "import json; print(json.dumps(json.load(open('vision_runs_history.json')), indent=2))"
+
+# Show just the run summaries
+python3 -c "
+import json
+runs = json.load(open('vision_runs_history.json'))
+for r in runs:
+    m = r['meta']; s = r['sam']; sc = r['scene']
+    print(f\"Run #{m['run_no']} | {m['timestamp']} | objects={s.get('total_detections','?')} | latency={m['latency_s']}s\")
+"
+```
+
+---
+
+### Manually clear the history
+
+```bash
+rm vision_runs_history.json
+```
+
+The next run will start fresh from run #1.
+
+---
+
+## File Structure
+
+```
+vision/
+├── vision_scripts/
+│   └── collect_and_export.py   ← the collector script
+├── vision_runs_history.json    ← created on first run
+├── vision_runs_export.xlsx     ← created on first run
+└── docs/
+    └── COLLECT_AND_EXPORT.md   ← this file
+```
+
+---
+
+## Services Called (in order)
+
+| # | Service | Type | Purpose |
+|---|---|---|---|
+| 1 | `/vision/run_pipeline` | `std_srvs/Trigger` | SAM detects objects, publishes to topic |
+| 2 | `/vision/classify_bbox_filtered` | `std_srvs/Trigger` | CLIP labels each region (conf > 0.5) |
+| 3 | `/vision/understand_scene` | `std_srvs/Trigger` | Full scene: objects + relations + grasps |
+
+If a service is not running, the step is skipped and that section of the run record will show `"success": false`.
+The JSON and Excel are still saved with whatever data was collected.
diff --git a/setup.py b/setup.py
index f82099a..569de07 100644
--- a/setup.py
+++ b/setup.py
@@ -47,6 +47,7 @@
         'scipy>=1.11.0',
         'scikit-learn>=1.3.0',
         'pandas>=2.0.0',
+        'openpyxl>=3.1.0',
         'tqdm>=4.66.0',
         'jsonschema>=4.19.0',
     ],
@@ -58,6 +59,7 @@
     tests_require=['pytest'],
     entry_points={
         'console_scripts': [
+            'collect_and_export = vision_scripts.collect_and_export:main',
             'simple_sam_detector = vision.simple_sam_detector:main',
             'clip_classifier = vision.clip_classifier:main',
             'sam_clip_pipeline = vision.sam_clip_pipeline:main',
diff --git a/vision/benchmark_dashboard.py b/vision/benchmark_dashboard.py
index 3bc0459..552365c 100644
--- a/vision/benchmark_dashboard.py
+++ b/vision/benchmark_dashboard.py
@@ -356,6 +356,17 @@ def do_GET(self):
                     self.end_headers()
                     data_json = json.dumps(self.dashboard_node.data)
                     self.wfile.write(data_json.encode())
+                elif self.path == '/api/run-history':
+                    # Serve vision_runs_history.json from workspace root
+                    history_file = package_path / 'vision_runs_history.json'
+                    self.send_response(200)
+                    self.send_header('Content-type', 'application/json')
+                    self.send_header('Access-Control-Allow-Origin', '*')
+                    self.end_headers()
+                    if history_file.exists():
+                        self.wfile.write(history_file.read_bytes())
+                    else:
+                        self.wfile.write(b'[]')
                 else:
                     # Serve static files
                     super().do_GET()
diff --git a/vision_scripts/collect_and_export.py b/vision_scripts/collect_and_export.py
new file mode 100644
index 0000000..b61ae99
--- /dev/null
+++ b/vision_scripts/collect_and_export.py
@@ -0,0 +1,497 @@
+#!/usr/bin/env python3
+"""
+Vision Pipeline Data Collector & Excel Exporter
+
+Calls the 3 vision services below in sequence, stores the last 20 runs in a JSON
+history file, and exports every run to an Excel workbook (4 sheets).
+
+Services called (in order):
+    1. /vision/run_pipeline          (std_srvs/Trigger)  -> SAM detects + publishes
+    2. /vision/classify_bbox_filtered (std_srvs/Trigger)  -> CLIP labels per region
+    3. /vision/understand_scene      (std_srvs/Trigger)   -> objects + relations + grasps
+
+Output files (written to the directory above vision_scripts/, next to README.md):
+    vision_runs_history.json   — rolling last-20-runs database
+    vision_runs_export.xlsx    — Excel workbook, 4 sheets:
+        • Runs      — one row per pipeline run
+        • Objects   — one row per detected object
+        • Relations — one row per spatial relation
+        • Grasps    — one row per grasp pose
+
+Usage:
+    # Make sure the vision nodes are already running, then:
+    python3 vision_scripts/collect_and_export.py
+
+    # Or as a ROS2 entry point (after colcon build):
+    ros2 run vision collect_and_export
+"""
+
+import rclpy
+from rclpy.node import Node
+from std_srvs.srv import Trigger
+import json
+import time
+import os
+import sys
+from datetime import datetime
+from pathlib import Path
+
+# ---------------------------------------------------------------------------
+# Output file paths  (workspace root = parent of this script's package dir)
+# ---------------------------------------------------------------------------
+_SCRIPT_DIR = Path(__file__).resolve().parent
+_WORKSPACE_ROOT = _SCRIPT_DIR.parent
+HISTORY_FILE = _WORKSPACE_ROOT / "vision_runs_history.json"
+EXCEL_FILE = _WORKSPACE_ROOT / "vision_runs_export.xlsx"
+MAX_HISTORY = 20
+
+
+# ---------------------------------------------------------------------------
+# Helper: load / save history
+# ---------------------------------------------------------------------------
+
+def _load_history():
+    if HISTORY_FILE.exists():
+        try:
+            with open(HISTORY_FILE, "r") as f:
+                data = json.load(f)
+            if isinstance(data, list):
+                return data
+        except Exception:
+            pass
+    return []
+
+
+def _save_history(runs):
+    runs = runs[-MAX_HISTORY:]  # keep last 20 only
+    with open(HISTORY_FILE, "w") as f:
+        json.dump(runs, f, indent=2)
+
+
+# ---------------------------------------------------------------------------
+# Helper: export to Excel using openpyxl
+# ---------------------------------------------------------------------------
+
+def _export_excel(runs):
+    """Write runs list → Excel with 4 sheets."""
+    try:
+        from openpyxl import Workbook
+        from openpyxl.styles import PatternFill, Font, Alignment
+        from openpyxl.utils import get_column_letter
+    except ImportError:
+        print("[WARN] openpyxl not installed. Run: pip install openpyxl")
+        print("[WARN] Skipping Excel export. JSON history saved successfully.")
+        return
+
+    wb = Workbook()
+
+    # ---- colour scheme ----
+    header_fill = PatternFill("solid", fgColor="4F81BD")
+    header_font = Font(bold=True, color="FFFFFF")
+    alt_fill    = PatternFill("solid", fgColor="DCE6F1")
+
+    def _write_sheet(ws, headers, rows, colour_col=None):
+        """Write header row then data rows with alternating row colour."""
+        ws.append(headers)
+        for cell in ws[1]:
+            cell.fill = header_fill
+            cell.font = header_font
+            cell.alignment = Alignment(horizontal="center")
+        for row_idx, row in enumerate(rows, start=2):
+            ws.append(row)
+            if row_idx % 2 == 0:
+                for cell in ws[row_idx]:
+                    cell.fill = alt_fill
+        # Auto-width
+        for col_idx, header in enumerate(headers, start=1):
+            col_letter = get_column_letter(col_idx)
+            max_len = len(str(header))
+            for row in ws.iter_rows(min_col=col_idx, max_col=col_idx):
+                for cell in row:
+                    try:
+                        max_len = max(max_len, len(str(cell.value or "")))
+                    except Exception:
+                        pass
+            ws.column_dimensions[col_letter].width = min(max_len + 4, 40)
+
+    # ---- Sheet 1: Runs ----
+    ws_runs = wb.active
+    ws_runs.title = "Runs"
+    runs_headers = [
+        "Run No", "Timestamp", "SAM Total Objects", "CLIP Filtered Regions",
+        "Graspable Objects", "Total Relations", "Avg SAM Confidence",
+        "Avg IoU", "Stability Rate (%)", "Scene Description",
+        "SAM Success", "CLIP Success", "Scene Success", "Latency (s)"
+    ]
+    runs_rows = []
+    for run in runs:
+        meta = run.get("meta", {})
+        sam  = run.get("sam", {})
+        clip = run.get("clip", {})
+        scene = run.get("scene", {})
+        runs_rows.append([
+            meta.get("run_no", ""),
+            meta.get("timestamp", ""),
+            sam.get("total_detections", ""),
+            clip.get("filtered_regions", ""),
+            scene.get("graspable_objects", ""),
+            scene.get("total_relations", ""),
+            sam.get("avg_confidence", ""),
+            sam.get("average_iou", ""),
+            round(sam.get("stability_rate", 0) * 100, 1),
+            scene.get("scene_description", ""),
+            sam.get("success", ""),
+            clip.get("success", ""),
+            scene.get("success", ""),
+            meta.get("latency_s", ""),
+        ])
+    _write_sheet(ws_runs, runs_headers, runs_rows)
+
+    # ---- Sheet 2: Objects ----
+    ws_obj = wb.create_sheet("Objects")
+    obj_headers = [
+        "Run No", "Timestamp", "Object ID", "CLIP Label",
+        "BBox X1", "BBox Y1", "BBox X2", "BBox Y2",
+        "SAM Confidence", "CLIP Confidence",
+        "Distance (cm)", "IoU Score", "Is Stable",
+        "Has Grasp", "Grasp Quality", "Grasp Width (m)"
+    ]
+    obj_rows = []
+    for run in runs:
+        meta  = run.get("meta", {})
+        run_no = meta.get("run_no", "")
+        ts     = meta.get("timestamp", "")
+        for obj in run.get("objects", []):
+            grasp = obj.get("grasp", {})
+            obj_rows.append([
+                run_no, ts,
+                obj.get("object_id", ""),
+                obj.get("label", ""),
+                obj.get("bbox_x1", ""), obj.get("bbox_y1", ""),
+                obj.get("bbox_x2", ""), obj.get("bbox_y2", ""),
+                obj.get("sam_confidence", ""),
+                obj.get("clip_confidence", ""),
+                obj.get("distance_cm", ""),
+                obj.get("iou_score", ""),
+                obj.get("is_stable", ""),
+                obj.get("has_grasp", ""),
+                grasp.get("quality_score", ""),
+                grasp.get("width_m", ""),
+            ])
+    _write_sheet(ws_obj, obj_headers, obj_rows)
+
+    # ---- Sheet 3: Relations ----
+    ws_rel = wb.create_sheet("Relations")
+    rel_headers = [
+        "Run No", "Timestamp", "Scene ID",
+        "Subject", "Relation", "Target Object",
+        "Confidence", "Distance 2D", "Description"
+    ]
+    rel_rows = []
+    for run in runs:
+        meta   = run.get("meta", {})
+        run_no = meta.get("run_no", "")
+        ts     = meta.get("timestamp", "")
+        scene  = run.get("scene", {})
+        scene_id = scene.get("scene_id", "")
+        for rel in run.get("relations", []):
+            rel_rows.append([
+                run_no, ts, scene_id,
+                rel.get("subject", ""),
+                rel.get("relation", ""),
+                rel.get("target_object", ""),
+                rel.get("confidence", ""),
+                rel.get("distance_2d", ""),
+                rel.get("description", ""),
+            ])
+    _write_sheet(ws_rel, rel_headers, rel_rows)
+
+    # ---- Sheet 4: Grasps ----
+    ws_grasp = wb.create_sheet("Grasps")
+    grasp_headers = [
+        "Run No", "Timestamp",
+        "Object ID", "Pos X (m)", "Pos Y (m)", "Pos Z (m)",
+        "Orient X", "Orient Y", "Orient Z", "Orient W",
+        "Quality Score", "Grasp Width (m)", "Approach Direction"
+    ]
+    grasp_rows = []
+    for run in runs:
+        meta   = run.get("meta", {})
+        run_no = meta.get("run_no", "")
+        ts     = meta.get("timestamp", "")
+        for g in run.get("grasps", []):
+            grasp_rows.append([
+                run_no, ts,
+                g.get("object_id", ""),
+                g.get("pos_x", ""), g.get("pos_y", ""), g.get("pos_z", ""),
+                g.get("orient_x", ""), g.get("orient_y", ""),
+                g.get("orient_z", ""), g.get("orient_w", ""),
+                g.get("quality_score", ""),
+                g.get("width_m", ""),
+                g.get("approach_direction", ""),
+            ])
+    _write_sheet(ws_grasp, grasp_headers, grasp_rows)
+
+    wb.save(str(EXCEL_FILE))
+    print(f"[OK] Excel exported → {EXCEL_FILE}")
+
+
+# ---------------------------------------------------------------------------
+# ROS2 collector node
+# ---------------------------------------------------------------------------
+
+class VisionDataCollector(Node):
+
+    def __init__(self):
+        super().__init__("vision_data_collector")
+
+        self._sam_client   = self.create_client(Trigger, "/vision/run_pipeline")
+        self._clip_client  = self.create_client(Trigger, "/vision/classify_bbox_filtered")
+        self._scene_client = self.create_client(Trigger, "/vision/understand_scene")
+
+    # ------------------------------------------------------------------
+    # Low-level call helper
+    # ------------------------------------------------------------------
+
+    def _call(self, client, service_name, timeout=10.0):
+        """Wait for service, call it, return (success, message_str)."""
+        self.get_logger().info(f"Waiting for {service_name} ...")
+        if not client.wait_for_service(timeout_sec=5.0):
+            self.get_logger().warn(f"{service_name} not available — skipping")
+            return False, None
+
+        future = client.call_async(Trigger.Request())
+        start = time.time()
+        while not future.done():
+            rclpy.spin_once(self, timeout_sec=0.05)
+            if time.time() - start > timeout:
+                self.get_logger().error(f"{service_name} call timed out")
+                return False, None
+
+        result = future.result()
+        if result is None:
+            return False, None
+        return result.success, result.message
+
+    # ------------------------------------------------------------------
+    # Collect one run
+    # ------------------------------------------------------------------
+
+    def collect_run(self, run_no):
+        """Call all services and return a unified run dict."""
+        ts = datetime.utcnow().isoformat() + "Z"
+        t0 = time.perf_counter()
+
+        run = {
+            "meta": {"run_no": run_no, "timestamp": ts},
+            "sam":  {"success": False},
+            "clip": {"success": False},
+            "scene": {"success": False},
+            "objects":   [],
+            "relations": [],
+            "grasps":    [],
+        }
+
+        # ---- 1. SAM ----
+        self.get_logger().info("=" * 60)
+        self.get_logger().info(f"RUN #{run_no} — Step 1: SAM /vision/run_pipeline")
+        sam_ok, sam_msg = self._call(self._sam_client, "/vision/run_pipeline")
+        if sam_ok and sam_msg:
+            try:
+                sam_data = json.loads(sam_msg)
+                summary  = sam_data.get("summary", {})
+                metrics  = sam_data.get("metrics", {})
+                coco     = metrics.get("coco_ap_style", {})
+                circ     = metrics.get("circularity_confidence", {})
+
+                run["sam"] = {
+                    "success":       True,
+                    "total_detections": summary.get("total_detections", 0),
+                    "avg_confidence":   circ.get("average_confidence", 0.0),
+                    "average_iou":      coco.get("average_iou", 0.0),
+                    "stability_rate":   coco.get("stability_rate", 0.0),
+                }
+
+                # Parse per-object data from SAM response
+                for frame in sam_data.get("detections", []):
+                    for det in frame.get("detections", []):
+                        bbox = det.get("bbox", [0, 0, 0, 0])
+                        run["objects"].append({
+                            "object_id":      det.get("class_name", "object"),
+                            "label":          "",           # filled by CLIP below
+                            "bbox_x1":        bbox[0] if len(bbox) > 0 else "",
+                            "bbox_y1":        bbox[1] if len(bbox) > 1 else "",
+                            "bbox_x2":        bbox[2] if len(bbox) > 2 else "",
+                            "bbox_y2":        bbox[3] if len(bbox) > 3 else "",
+                            "sam_confidence": det.get("confidence", ""),
+                            "clip_confidence": "",
+                            "distance_cm":    det.get("distance_cm", ""),
+                            "iou_score":      det.get("iou_with_previous", ""),
+                            "is_stable":      det.get("is_stable_detection", ""),
+                            "has_grasp":      False,
+                            "grasp":          {},
+                        })
+                self.get_logger().info(f"  SAM: {run['sam']['total_detections']} objects detected")
+            except Exception as e:
+                self.get_logger().error(f"  SAM parse error: {e}")
+
+        # Wait 500 ms for CLIP to auto-process the published SAM topic
+        time.sleep(0.5)
+
+        # ---- 2. CLIP ----
+        self.get_logger().info(f"RUN #{run_no} — Step 2: CLIP /vision/classify_bbox_filtered")
+        clip_ok, clip_msg = self._call(self._clip_client, "/vision/classify_bbox_filtered")
+        if clip_ok and clip_msg:
+            try:
+                clip_data = json.loads(clip_msg)
+                run["clip"] = {
+                    "success":          True,
+                    "total_sam_regions": clip_data.get("total_sam_regions", 0),
+                    "filtered_regions":  clip_data.get("filtered_regions", 0),
+                }
+                # Merge CLIP labels into objects by region_id index
+                clip_regions = {r["region_id"]: r for r in clip_data.get("regions", [])}
+                for idx, obj in enumerate(run["objects"]):
+                    region = clip_regions.get(idx)
+                    if region:
+                        obj["label"]           = region.get("label", "")
+                        obj["clip_confidence"] = region.get("confidence", "")
+                self.get_logger().info(f"  CLIP: {run['clip']['filtered_regions']} regions classified")
+            except Exception as e:
+                self.get_logger().error(f"  CLIP parse error: {e}")
+
+        # ---- 3. Scene Understanding ----
+        self.get_logger().info(f"RUN #{run_no} — Step 3: Scene /vision/understand_scene")
+        scene_ok, scene_msg = self._call(self._scene_client, "/vision/understand_scene", timeout=15.0)
+        if scene_ok and scene_msg:
+            try:
+                scene_data = json.loads(scene_msg)
+                run["scene"] = {
+                    "success":           True,
+                    "scene_id":          scene_data.get("scene_id", ""),
+                    "total_objects":     scene_data.get("total_objects", 0),
+                    "total_relations":   scene_data.get("total_relations", 0),
+                    "graspable_objects": scene_data.get("graspable_objects", 0),
+                    "scene_description": scene_data.get("scene_description", ""),
+                }
+
+                # Per-object details (enriches existing objects list)
+                scene_objects = scene_data.get("objects", {})
+                for obj_id, obj_info in scene_objects.items():
+                    # Try to match to an existing object entry by bounding box proximity
+                    # or append a new entry if scene understanding found it
+                    matched = False
+                    s_bbox = obj_info.get("bbox", [])
+                    for obj in run["objects"]:
+                        if (len(s_bbox) >= 4 and
+                                obj.get("bbox_x1") == s_bbox[0] and
+                                obj.get("bbox_y1") == s_bbox[1]):
+                            # Update with scene info
+                            obj["label"]    = obj.get("label") or obj_info.get("label", "")
+                            obj["has_grasp"] = obj_info.get("has_grasp", False)
+                            if obj_info.get("has_grasp") and obj_info.get("grasp_quality") is not None:
+                                obj["grasp"] = {
+                                    "quality_score": obj_info.get("grasp_quality"),
+                                    "width_m":       "",  # not available at this level
+                                }
+                            matched = True
+                            break
+
+                    if not matched:
+                        s_bbox_safe = s_bbox if len(s_bbox) >= 4 else ["", "", "", ""]
+                        run["objects"].append({
+                            "object_id":      obj_id,
+                            "label":          obj_info.get("label", ""),
+                            "bbox_x1":        s_bbox_safe[0],
+                            "bbox_y1":        s_bbox_safe[1],
+                            "bbox_x2":        s_bbox_safe[2],
+                            "bbox_y2":        s_bbox_safe[3],
+                            "sam_confidence": "",
+                            "clip_confidence": obj_info.get("confidence", ""),
+                            "distance_cm":    obj_info.get("distance_cm", ""),
+                            "iou_score":      "",
+                            "is_stable":      "",
+                            "has_grasp":      obj_info.get("has_grasp", False),
+                            "grasp": {
+                                "quality_score": obj_info.get("grasp_quality", ""),
+                                "width_m":       "",
+                            },
+                        })
+
+                    # Relations for this object
+                    for rel in obj_info.get("relations", []):
+                        run["relations"].append({
+                            "subject":       obj_id,
+                            "relation":      rel.get("relation", ""),
+                            "target_object": rel.get("target_object", ""),
+                            "confidence":    rel.get("confidence", ""),
+                            "distance_2d":   rel.get("distance_2d", ""),
+                            "description":   rel.get("description", ""),
+                        })
+
+                self.get_logger().info(
+                    f"  Scene: {run['scene']['total_objects']} objects, "
+                    f"{run['scene']['total_relations']} relations"
+                )
+            except Exception as e:
+                self.get_logger().error(f"  Scene parse error: {e}")
+
+        # ---- Finalize ----
+        run["meta"]["latency_s"] = round(time.perf_counter() - t0, 3)
+        self.get_logger().info(
+            f"RUN #{run_no} complete in {run['meta']['latency_s']}s — "
+            f"{len(run['objects'])} objects, {len(run['relations'])} relations"
+        )
+        self.get_logger().info("=" * 60)
+        return run
+
+
+# ---------------------------------------------------------------------------
+# Entry point
+# ---------------------------------------------------------------------------
+
+def main(args=None):
+    rclpy.init(args=args)
+
+    node = VisionDataCollector()
+
+    print()
+    print("=" * 60)
+    print("  Vision Pipeline Data Collector & Excel Exporter")
+    print("=" * 60)
+    print(f"  History file : {HISTORY_FILE}")
+    print(f"  Excel file   : {EXCEL_FILE}")
+    print(f"  Max runs kept: {MAX_HISTORY}")
+    print("=" * 60)
+
+    try:
+        # Determine the next run number from existing history
+        history = _load_history()
+        last_run_no = history[-1]["meta"]["run_no"] if history else 0
+        run_no = last_run_no + 1
+
+        # Collect the run
+        run = node.collect_run(run_no)
+
+        # Append to history and persist
+        history.append(run)
+        _save_history(history)
+        print(f"[OK] History saved → {HISTORY_FILE}  ({len(history[-MAX_HISTORY:])} runs stored)")
+
+        # Export all stored runs to Excel
+        _export_excel(history[-MAX_HISTORY:])
+
+        print()
+        print("Done. Open vision_runs_export.xlsx to view results.")
+        print()
+
+    except KeyboardInterrupt:
+        pass
+    finally:
+        node.destroy_node()
+        if rclpy.ok():
+            rclpy.shutdown()
+
+
+if __name__ == "__main__":
+    main()  # run one collect-and-export cycle only when executed as a script

From 0177a111bbdd83641b69b0c0fd1d4c7e48da4f89 Mon Sep 17 00:00:00 2001
From: Methasit-Pun <methasitpun@gmail.com>
Date: Sat, 4 Apr 2026 00:07:59 +0700
Subject: [PATCH 07/16] feat: add mini dashboard

---
 dashboard/index.html                 |  221 +++++-
 dashboard/objects.html               | 1049 ++++++++++++++++++++++++++
 vision_scripts/collect_and_export.py |  162 +++-
 3 files changed, 1400 insertions(+), 32 deletions(-)
 create mode 100644 dashboard/objects.html

diff --git a/dashboard/index.html b/dashboard/index.html
index 1071733..a3bd85d 100644
--- a/dashboard/index.html
+++ b/dashboard/index.html
@@ -500,6 +500,17 @@
         Pixel → Real
         <span class="sb-count" id="nav-pixel">0</span>
     </div>
+    <div class="sb-link" onclick="jumpTo('sec-obb')">
+        <div class="sb-dot" style="background:#f97316"></div>
+        OBB Angles
+        <span class="sb-count" id="nav-obb">0</span>
+    </div>
+
+    <div class="sb-group">Analysis</div>
+    <div class="sb-link" onclick="window.location.href='objects.html'">
+        <div class="sb-dot" style="background:#6366f1"></div>
+        Object Explorer
+    </div>
 </nav>
 
 <!-- ══════════════════════════════════ MAIN ═════════════════════════════════ -->
@@ -550,6 +561,11 @@
                 <div class="kpi-value" id="pixelCount">0</div>
                 <div class="kpi-label">Pixel→Real</div>
             </div>
+            <div class="kpi-card" style="--accent:#f97316">
+                <div class="kpi-value" id="obbCount">0</div>
+                <div class="kpi-label">OBB Objects</div>
+                <div class="kpi-sub">Latest run</div>
+            </div>
             <div class="kpi-card" style="--accent:#64748b">
                 <div class="kpi-value" id="totalCalls">0</div>
                 <div class="kpi-label">Total Svc Calls</div>
@@ -583,7 +599,23 @@
                 </div>
                 <div class="metric-tile">
                     <div class="metric-val" id="rhLastLatency">—</div>
-                    <div class="metric-lbl">Last Latency</div>
+                    <div class="metric-lbl">Total Latency</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhSamLatency">—</div>
+                    <div class="metric-lbl">SAM Latency</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhClipLatency">—</div>
+                    <div class="metric-lbl">CLIP Latency</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhSceneLatency">—</div>
+                    <div class="metric-lbl">Scene Latency</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="rhObbLatency">—</div>
+                    <div class="metric-lbl">OBB Latency</div>
                 </div>
             </div>
             <div class="table-wrap">
@@ -591,19 +623,25 @@
                     <thead><tr>
                         <th>Run</th>
                         <th>Timestamp</th>
-                        <th>Latency (s)</th>
-                        <th>SAM Detections</th>
+                        <th>Total (s)</th>
+                        <th>SAM (s)</th>
+                        <th>CLIP (s)</th>
+                        <th>Scene (s)</th>
+                        <th>OBB (s)</th>
+                        <th>SAM Objects</th>
                         <th>SAM Avg Conf</th>
                         <th>CLIP Filtered</th>
                         <th>Scene Objects</th>
                         <th>Relations</th>
                         <th>Graspable</th>
+                        <th>OBB Objects</th>
                         <th>SAM</th>
                         <th>CLIP</th>
                         <th>Scene</th>
+                        <th>OBB</th>
                     </tr></thead>
                     <tbody id="runHistoryBody">
-                        <tr class="no-data-row"><td colspan="12">No run history yet — run <code>collect_and_export.py</code></td></tr>
+                        <tr class="no-data-row"><td colspan="18">No run history yet — run <code>collect_and_export.py</code></td></tr>
                     </tbody>
                 </table>
             </div>
@@ -633,9 +671,12 @@
                         <th>Stable</th>
                         <th>Has Grasp</th>
                         <th>Grasp Quality</th>
+                        <th>OBB Angle (°)</th>
+                        <th>OBB Width (px)</th>
+                        <th>OBB Height (px)</th>
                     </tr></thead>
                     <tbody id="latestObjectsBody">
-                        <tr class="no-data-row"><td colspan="10">No data yet</td></tr>
+                        <tr class="no-data-row"><td colspan="13">No data yet</td></tr>
                     </tbody>
                 </table>
             </div>
@@ -668,6 +709,59 @@
             </div>
         </div>
 
+        <!-- ── OBB Angle Benchmark ─────────────────────────────────── -->
+        <div id="sec-obb" class="section-card">
+            <div class="section-head">
+                <div class="section-accent" style="background:#f97316"></div>
+                <div>
+                    <div class="section-title">OBB — Oriented Bounding Box Angle Benchmark</div>
+                    <div class="section-subtitle">/obb/find_object_angle · angle parallel to width · 0° = vertical · range −90° to +90°</div>
+                </div>
+                <span class="section-badge" id="obbBadge" style="background:#f97316">0 Objects</span>
+            </div>
+            <div class="metric-strip">
+                <div class="metric-tile">
+                    <div class="metric-val" id="obbTotalObjects">—</div>
+                    <div class="metric-lbl">Objects (Latest)</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="obbAvgAngle">—</div>
+                    <div class="metric-lbl">Avg Angle (°)</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="obbMinAngle">—</div>
+                    <div class="metric-lbl">Min Angle (°)</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="obbMaxAngle">—</div>
+                    <div class="metric-lbl">Max Angle (°)</div>
+                </div>
+                <div class="metric-tile">
+                    <div class="metric-val" id="obbLatency">—</div>
+                    <div class="metric-lbl">OBB Latency (s)</div>
+                </div>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Object ID</th>
+                        <th>Label</th>
+                        <th>OBB Angle (°)</th>
+                        <th>OBB Theta (rad)</th>
+                        <th>OBB Width (px)</th>
+                        <th>OBB Height (px)</th>
+                        <th>Center (u, v)</th>
+                        <th>Bounding Box</th>
+                        <th>SAM Confidence</th>
+                        <th>Distance (cm)</th>
+                    </tr></thead>
+                    <tbody id="obbBody">
+                        <tr class="no-data-row"><td colspan="10">No OBB data — ensure <code>obb_angle_service_node</code> is running</td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
         <!-- ── SAM ──────────────────────────────────────────────────── -->
         <div id="sec-sam" class="section-label">Service Monitor</div>
         <div class="section-card">
@@ -1138,29 +1232,45 @@
         document.getElementById('rhLastRelations').textContent= latest.scene?.total_relations ?? '—';
         document.getElementById('rhLastLatency').textContent  =
             latest.meta?.latency_s != null ? latest.meta.latency_s.toFixed(2) + ' s' : '—';
-
-        // Run history table
+        document.getElementById('rhSamLatency').textContent   =
+            latest.sam?.latency_s  != null ? latest.sam.latency_s.toFixed(2)  + ' s' : '—';
+        document.getElementById('rhClipLatency').textContent  =
+            latest.clip?.latency_s != null ? latest.clip.latency_s.toFixed(2) + ' s' : '—';
+        document.getElementById('rhSceneLatency').textContent =
+            latest.scene?.latency_s!= null ? latest.scene.latency_s.toFixed(2)+ ' s' : '—';
+        document.getElementById('rhObbLatency').textContent   =
+            latest.obb?.latency_s  != null ? latest.obb.latency_s.toFixed(2)  + ' s' : '—';
+
+        // Run history table — update to include latency per service and OBB
         tbody.innerHTML = runs.slice().reverse().map(run => {
-            const meta  = run.meta  || {};
-            const sam   = run.sam   || {};
-            const clip  = run.clip  || {};
-            const scene = run.scene || {};
-            const t = meta.timestamp ? new Date(meta.timestamp).toLocaleString() : '—';
-            return `<tr>
-                <td><span class="chip chip-run">#${meta.run_no ?? '?'}</span></td>
-                <td class="ts">${t}</td>
-                <td class="mono">${meta.latency_s != null ? meta.latency_s.toFixed(2) : '—'}</td>
-                <td class="mono">${sam.total_detections ?? '—'}</td>
-                <td>${sam.avg_confidence != null ? confBar(sam.avg_confidence) : '—'}</td>
-                <td class="mono">${clip.filtered_regions ?? '—'}</td>
-                <td class="mono">${scene.total_objects   ?? '—'}</td>
-                <td class="mono">${scene.total_relations ?? '—'}</td>
-                <td class="mono">${scene.graspable_objects ?? '—'}</td>
-                <td>${chipSvc(sam.success)}</td>
-                <td>${chipSvc(clip.success)}</td>
-                <td>${chipSvc(scene.success)}</td>
-            </tr>`;
-        }).join('');
+                const meta  = run.meta  || {};
+                const sam   = run.sam   || {};
+                const clip  = run.clip  || {};
+                const scene = run.scene || {};
+                const obb   = run.obb   || {};
+                const t = meta.timestamp ? new Date(meta.timestamp).toLocaleString() : '—';
+                const obbObjects = (run.objects || []).filter(o => o.obb_angle_deg !== '' && o.obb_angle_deg != null).length;
+                return `<tr>
+                    <td><span class="chip chip-run">#${meta.run_no ?? '?'}</span></td>
+                    <td class="ts">${t}</td>
+                    <td class="mono">${meta.latency_s  != null ? meta.latency_s.toFixed(2)  : '—'}</td>
+                    <td class="mono">${sam.latency_s   != null ? sam.latency_s.toFixed(2)   : '—'}</td>
+                    <td class="mono">${clip.latency_s  != null ? clip.latency_s.toFixed(2)  : '—'}</td>
+                    <td class="mono">${scene.latency_s != null ? scene.latency_s.toFixed(2) : '—'}</td>
+                    <td class="mono">${obb.latency_s   != null ? obb.latency_s.toFixed(2)   : '—'}</td>
+                    <td class="mono">${sam.total_detections ?? '—'}</td>
+                    <td>${sam.avg_confidence != null ? confBar(sam.avg_confidence) : '—'}</td>
+                    <td class="mono">${clip.filtered_regions ?? '—'}</td>
+                    <td class="mono">${scene.total_objects   ?? '—'}</td>
+                    <td class="mono">${scene.total_relations ?? '—'}</td>
+                    <td class="mono">${scene.graspable_objects ?? '—'}</td>
+                    <td class="mono">${obbObjects}</td>
+                    <td>${chipSvc(sam.success)}</td>
+                    <td>${chipSvc(clip.success)}</td>
+                    <td>${chipSvc(scene.success)}</td>
+                    <td>${chipSvc(obb.success)}</td>
+                </tr>`;
+            }).join('');
 
         // Latest objects
         const objects = latest.objects || [];
@@ -1177,6 +1287,9 @@
             <td>${chipOk(obj.is_stable)}</td>
             <td>${chipOk(obj.has_grasp)}</td>
             <td>${obj.grasp ? confBar(obj.grasp.quality_score) : '<span style="color:var(--text-muted)">—</span>'}</td>
+            <td class="mono" style="font-weight:600">${obj.obb_angle_deg != null && obj.obb_angle_deg !== '' ? obj.obb_angle_deg.toFixed(1) + '°' : '<span style="color:var(--text-muted)">—</span>'}</td>
+            <td class="mono">${obj.obb_width_px  != null && obj.obb_width_px  !== '' ? Math.round(obj.obb_width_px)  : '—'}</td>
+            <td class="mono">${obj.obb_height_px != null && obj.obb_height_px !== '' ? Math.round(obj.obb_height_px) : '—'}</td>
         </tr>`).join('') : noObj;
 
         // Latest relations
@@ -1191,6 +1304,60 @@
             <td class="mono">${rel.distance_2d != null ? rel.distance_2d.toFixed(1) : '—'}</td>
             <td style="font-size:12px;color:var(--text-secondary)">${rel.description ?? ''}</td>
         </tr>`).join('') : noRel;
+
+        // OBB section from latest run
+        updateOBBSection(latest);
+    }
+
+    function updateOBBSection(latestRun) {
+        const obbMeta = latestRun.obb || {};
+        const objects = (latestRun.objects || []).filter(o => o.obb_angle_deg != null && o.obb_angle_deg !== '');
+        const tbody   = document.getElementById('obbBody');
+
+        document.getElementById('obbBadge').textContent       = `${objects.length} Objects`;
+        document.getElementById('obbTotalObjects').textContent = objects.length;
+        document.getElementById('obbLatency').textContent      =
+            obbMeta.latency_s != null ? obbMeta.latency_s.toFixed(2) + ' s' : '—';
+        setNav('nav-obb', objects.length);
+        document.getElementById('obbCount').textContent = objects.length;
+
+        if (!objects.length) {
+            document.getElementById('obbAvgAngle').textContent = '—';
+            document.getElementById('obbMinAngle').textContent = '—';
+            document.getElementById('obbMaxAngle').textContent = '—';
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="10">No OBB data — ensure <code>obb_angle_service_node</code> is running</td></tr>';
+            return;
+        }
+
+        const angles = objects.map(o => o.obb_angle_deg);
+        const avg    = angles.reduce((s, v) => s + v, 0) / angles.length;
+        document.getElementById('obbAvgAngle').textContent = avg.toFixed(1) + '°';
+        document.getElementById('obbMinAngle').textContent = Math.min(...angles).toFixed(1) + '°';
+        document.getElementById('obbMaxAngle').textContent = Math.max(...angles).toFixed(1) + '°';
+
+        tbody.innerHTML = objects.map(obj => {
+            const angleDeg = obj.obb_angle_deg;
+            // Angle bar: map -90..+90 to 0..100%
+            const pct      = Math.round(((angleDeg + 90) / 180) * 100);
+            const barColor = Math.abs(angleDeg) < 20 ? 'var(--ok)' : Math.abs(angleDeg) < 60 ? 'var(--warn)' : 'var(--fail)';
+            return `<tr>
+                <td class="mono">${obj.object_id ?? '—'}</td>
+                <td><span class="chip chip-label">${obj.label ?? 'unknown'}</span></td>
+                <td>
+                    <div class="conf-bar">
+                        <div class="conf-track" style="width:80px"><div class="conf-fill" style="width:${pct}%;background:${barColor}"></div></div>
+                        <span class="conf-num" style="color:${barColor};min-width:52px">${angleDeg.toFixed(1)}°</span>
+                    </div>
+                </td>
+                <td class="mono">${obj.obb_theta_rad != null ? Number(obj.obb_theta_rad).toFixed(4) : '—'}</td>
+                <td class="mono">${obj.obb_width_px  != null ? Math.round(obj.obb_width_px)  : '—'}</td>
+                <td class="mono">${obj.obb_height_px != null ? Math.round(obj.obb_height_px) : '—'}</td>
+                <td class="mono">${obj.obb_center_u != null ? Math.round(obj.obb_center_u) : '—'}, ${obj.obb_center_v != null ? Math.round(obj.obb_center_v) : '—'}</td>
+                <td class="mono" style="font-size:11px">(${obj.bbox_x1??0},${obj.bbox_y1??0})→(${obj.bbox_x2??0},${obj.bbox_y2??0})</td>
+                <td>${confBar(obj.sam_confidence)}</td>
+                <td class="mono">${obj.distance_cm != null ? obj.distance_cm.toFixed(1) : '—'}</td>
+            </tr>`;
+        }).join('');
     }
 
     // ── Clear data (legacy) ───────────────────────────────────────────────────
diff --git a/dashboard/objects.html b/dashboard/objects.html
new file mode 100644
index 0000000..7af533a
--- /dev/null
+++ b/dashboard/objects.html
@@ -0,0 +1,1049 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Object Explorer — Vision Research Dashboard</title>
+    <style>
+        /* ── Design tokens (same palette as main dashboard) ─────────── */
+        :root {
+            --bg:            #f1f5f9;
+            --surface:       #ffffff;
+            --border:        #e2e8f0;
+            --text-primary:  #0f172a;
+            --text-secondary:#64748b;
+            --text-muted:    #94a3b8;
+
+            --color-sam:    #8b5cf6;
+            --color-clip:   #ec4899;
+            --color-grasp:  #f59e0b;
+            --color-obb:    #f97316;
+            --color-scene:  #10b981;
+            --color-obj:    #6366f1;
+
+            --ok:   #22c55e;
+            --warn: #f59e0b;
+            --fail: #ef4444;
+
+            --nav-bg:   #0f172a;
+            --nav-text: #94a3b8;
+            --radius:   10px;
+            --radius-sm:6px;
+            --shadow:   0 1px 3px rgba(0,0,0,.08);
+        }
+
+        *, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
+
+        body {
+            font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', sans-serif;
+            background: var(--bg);
+            color: var(--text-primary);
+            font-size: 13px;
+            line-height: 1.45;
+            display: flex;
+            min-height: 100vh;
+        }
+
+        /* ── Sidebar ──────────────────────────────────────────────────── */
+        #sidebar {
+            width: 226px; min-width: 226px;
+            background: var(--nav-bg);
+            position: fixed; top: 0; left: 0;
+            height: 100vh; z-index: 100;
+            display: flex; flex-direction: column;
+            overflow-y: auto;
+        }
+        .sb-brand { padding: 22px 18px 14px; border-bottom: 1px solid rgba(255,255,255,.07); }
+        .sb-brand-title { font-size: 13px; font-weight: 700; color: #fff; line-height: 1.35; }
+        .sb-brand-sub   { font-size: 11px; color: var(--nav-text); margin-top: 4px; }
+
+        .sb-group {
+            font-size: 10px; font-weight: 700; text-transform: uppercase;
+            letter-spacing: 1.1px; color: rgba(255,255,255,.22);
+            padding: 16px 18px 6px;
+        }
+        .sb-link {
+            display: flex; align-items: center; gap: 10px;
+            padding: 8px 18px; color: var(--nav-text);
+            font-size: 12.5px; font-weight: 500; cursor: pointer;
+            border-left: 3px solid transparent;
+            transition: background .12s, color .12s;
+            text-decoration: none;
+        }
+        .sb-link:hover { background: rgba(255,255,255,.06); color: #fff; }
+        .sb-link.active { border-left-color: var(--color-obj); color: #fff; background: rgba(99,102,241,.12); }
+        .sb-dot { width: 8px; height: 8px; border-radius: 50%; flex-shrink: 0; }
+        .sb-count {
+            margin-left: auto; font-size: 11px; font-weight: 600;
+            background: rgba(255,255,255,.09); padding: 1px 7px;
+            border-radius: 10px; color: rgba(255,255,255,.45);
+            min-width: 24px; text-align: center;
+        }
+
+        /* ── Main ─────────────────────────────────────────────────────── */
+        #main { margin-left: 226px; flex: 1; min-width: 0; display: flex; flex-direction: column; }
+
+        /* ── Topbar ───────────────────────────────────────────────────── */
+        #topbar {
+            background: var(--surface);
+            border-bottom: 1px solid var(--border);
+            padding: 12px 24px;
+            display: flex; align-items: center; gap: 12px;
+            position: sticky; top: 0; z-index: 90;
+            box-shadow: var(--shadow);
+            flex-wrap: wrap;
+            row-gap: 8px;
+        }
+        .tb-title { font-size: 15px; font-weight: 700; }
+        .tb-sub   { font-size: 11px; color: var(--text-secondary); margin-top: 1px; }
+
+        .ctrl-sep { width: 1px; height: 22px; background: var(--border); margin: 0 4px; }
+        .ctrl-label {
+            font-size: 10.5px; font-weight: 700; text-transform: uppercase;
+            letter-spacing: .5px; color: var(--text-secondary);
+        }
+
+        select, input[type="text"] {
+            border: 1px solid var(--border); border-radius: var(--radius-sm);
+            padding: 5px 10px; font-size: 12.5px;
+            color: var(--text-primary); background: var(--bg); outline: none;
+            transition: border .12s;
+        }
+        select:focus, input[type="text"]:focus { border-color: var(--color-obj); }
+
+        .btn {
+            padding: 5px 13px; border-radius: var(--radius-sm);
+            font-size: 12px; font-weight: 500; cursor: pointer;
+            border: 1px solid var(--border); background: var(--surface);
+            color: var(--text-secondary); transition: all .12s;
+            white-space: nowrap;
+        }
+        .btn:hover { background: var(--bg); color: var(--text-primary); }
+        .btn-primary {
+            background: var(--color-obj); color: #fff;
+            border-color: var(--color-obj);
+        }
+        .btn-primary:hover { background: #4f46e5; border-color: #4f46e5; }
+        .btn-green  { background: var(--ok); color: #fff; border-color: var(--ok); }
+        .btn-green:hover { background: #16a34a; }
+
+        .tb-right { margin-left: auto; display: flex; align-items: center; gap: 8px; flex-wrap: wrap; }
+
+        /* ── Page body ────────────────────────────────────────────────── */
+        .page-body { padding: 18px 24px; flex: 1; }
+
+        /* ── Summary pills ────────────────────────────────────────────── */
+        .summary-strip {
+            display: flex; gap: 10px; margin-bottom: 16px; flex-wrap: wrap;
+        }
+        .summary-pill {
+            background: var(--surface); border: 1px solid var(--border);
+            border-radius: 20px; padding: 5px 14px;
+            font-size: 12px; font-weight: 500;
+            display: flex; align-items: center; gap: 7px;
+        }
+        .pill-dot  { width: 7px; height: 7px; border-radius: 50%; flex-shrink: 0; }
+        .pill-val  { font-size: 15px; font-weight: 700; color: var(--text-primary); }
+        .pill-lbl  { color: var(--text-secondary); }
+
+        /* ── Section card ────────────────────────────────────────────── */
+        .section-card {
+            background: var(--surface); border: 1px solid var(--border);
+            border-radius: var(--radius); box-shadow: var(--shadow);
+            overflow: hidden;
+        }
+
+        /* ── Table ────────────────────────────────────────────────────── */
+        .table-wrap {
+            overflow: auto;
+            max-height: calc(100vh - 230px);
+        }
+        .table-wrap::-webkit-scrollbar { width: 5px; height: 5px; }
+        .table-wrap::-webkit-scrollbar-track { background: transparent; }
+        .table-wrap::-webkit-scrollbar-thumb { background: #cbd5e1; border-radius: 3px; }
+        .table-wrap::-webkit-scrollbar-thumb:hover { background: #94a3b8; }
+
+        table {
+            width: max-content;
+            min-width: 100%;
+            border-collapse: separate;
+            border-spacing: 0;
+            font-size: 12.5px;
+        }
+
+        /* Column group header row */
+        tr.cg-row th {
+            position: sticky; top: 0; z-index: 25;
+            padding: 5px 6px;
+            text-align: center;
+            font-size: 10px; font-weight: 800; text-transform: uppercase;
+            letter-spacing: .9px;
+            background: var(--surface);
+            border-bottom: 3px solid currentColor;
+            white-space: nowrap;
+        }
+        .cg-obj   { color: var(--color-obj); }
+        .cg-sam   { color: var(--color-sam); }
+        .cg-clip  { color: var(--color-clip); }
+        .cg-grasp { color: var(--color-grasp); }
+        .cg-obb   { color: var(--color-obb); }
+        .cg-scene { color: var(--color-scene); }
+
+        /* Column header row */
+        tr.ch-row th {
+            position: sticky; top: 27px; z-index: 24;
+            background: #f8fafc;
+            color: var(--text-secondary);
+            font-size: 10.5px; font-weight: 700;
+            text-transform: uppercase; letter-spacing: .6px;
+            padding: 7px 10px;
+            text-align: left;
+            border-bottom: 2px solid var(--border);
+            white-space: nowrap;
+            cursor: pointer; user-select: none;
+        }
+        tr.ch-row th:hover { background: #eef2f7; color: var(--text-primary); }
+        .sort-icon { margin-left: 3px; font-size: 9px; opacity: .35; }
+        th.sort-asc  .sort-icon,
+        th.sort-desc .sort-icon { opacity: 1; }
+
+        /* Sticky left columns */
+        .sc1 { position: sticky; left: 0;    z-index: 10; background: var(--surface); box-shadow: 2px 0 5px rgba(0,0,0,.04); min-width:148px; max-width:148px; }
+        .sc2 { position: sticky; left: 148px; z-index: 9;  background: var(--surface); min-width:96px; max-width:96px; }
+        .sc3 { position: sticky; left: 244px; z-index: 9;  background: var(--surface); min-width:56px; max-width:56px; }
+        thead .sc1 { z-index: 35; background: var(--surface); }
+        thead .sc2 { z-index: 34; background: #f8fafc; }
+        thead .sc3 { z-index: 34; background: #f8fafc; }
+        tr.cg-row .sc1 { background: var(--surface); z-index: 36; }
+
+        td {
+            padding: 9px 10px;
+            border-bottom: 1px solid #f1f5f9;
+            vertical-align: middle;
+            white-space: nowrap;
+        }
+        tbody tr:hover td { background: #fafbff; }
+        tbody tr:hover .sc1 { background: #f4f7ff; }
+        tbody tr:hover .sc2,
+        tbody tr:hover .sc3 { background: #f4f7ff; }
+
+        /* Group separator */
+        tr.group-row td {
+            background: #f8fafc;
+            border-top: 2px solid var(--border);
+            border-bottom: 1px solid var(--border);
+            padding: 5px 12px;
+            position: sticky; left: 0;
+        }
+        .group-label { font-weight: 700; font-size: 12px; color: var(--text-primary); margin-right: 10px; }
+
+        /* No data row */
+        tr.no-data td {
+            text-align: center; padding: 44px 20px;
+            color: var(--text-muted); font-style: italic;
+        }
+        tr.no-data code {
+            font-style: normal; font-size: 11.5px;
+            background: #f1f5f9; padding: 1px 6px; border-radius: 4px;
+            color: var(--text-secondary);
+        }
+
+        /* Editable name cell */
+        .name-cell { display: flex; align-items: center; gap: 5px; }
+        .name-val  { flex:1; font-weight:600; overflow:hidden; text-overflow:ellipsis; max-width:110px; }
+        .name-val.empty { color:var(--text-muted); font-weight:400; font-style:italic; }
+        .edit-btn {
+            opacity: 0; background: none; border: none; cursor: pointer;
+            font-size: 11px; color: var(--text-muted); padding: 1px 4px;
+            border-radius: 3px; transition: opacity .12s, background .12s;
+            flex-shrink: 0;
+        }
+        td:hover .edit-btn, .edit-btn:focus { opacity: 1; }
+        .edit-btn:hover { background: #f1f5f9; color: var(--color-obj); }
+        .name-input {
+            border: 1px solid var(--color-obj); border-radius: 4px;
+            padding: 3px 7px; font-size: 12px; outline: none; width: 130px;
+        }
+
+        /* Confidence bar */
+        .conf-bar  { display:flex; align-items:center; gap:5px; }
+        .conf-track{ width:42px; height:4px; background:#e2e8f0; border-radius:2px; overflow:hidden; flex-shrink:0; }
+        .conf-fill { height:100%; border-radius:2px; }
+        .cf-h { background:var(--ok); }
+        .cf-m { background:var(--warn); }
+        .cf-l { background:var(--fail); }
+        .conf-num { font-size:11.5px; font-weight:600; font-variant-numeric:tabular-nums; min-width:28px; }
+        .cn-h { color:#15803d; }
+        .cn-m { color:#92400e; }
+        .cn-l { color:#b91c1c; }
+
+        /* Angle bar (centred, -90 to +90) */
+        .ang-bar   { display:flex; align-items:center; gap:5px; }
+        .ang-track { width:50px; height:4px; background:#e2e8f0; border-radius:2px; position:relative; flex-shrink:0; }
+        .ang-mid   { position:absolute; left:50%; top:0; width:1px; height:100%; background:#94a3b8; }
+        .ang-fill  { position:absolute; top:0; height:100%; border-radius:2px; }
+
+        /* Chips */
+        .chip { display:inline-flex; align-items:center; gap:2px; padding:2px 7px; border-radius:9px; font-size:11px; font-weight:600; white-space:nowrap; }
+        .ck-ok    { background:#dcfce7; color:#15803d; }
+        .ck-fail  { background:#fee2e2; color:#dc2626; }
+        .ck-na    { background:#f1f5f9; color:#64748b; }
+        .ck-label { background:#ede9fe; color:#6d28d9; }
+        .ck-rel   { background:#ccfbf1; color:#0f766e; font-size:10.5px; }
+        .ck-run   { background:var(--bg); border:1px solid var(--border); border-radius:5px; padding:1px 7px; font-size:11.5px; font-weight:700; }
+
+        .mono { font-family:'SFMono-Regular','Consolas',monospace; }
+        .dim  { color:var(--text-muted); }
+
+        /* Relations cell */
+        .rel-cell { display:flex; flex-wrap:wrap; gap:2px; max-width:210px; }
+
+        /* Footer */
+        .footer {
+            border-top: 1px solid var(--border);
+            padding: 10px 24px;
+            font-size: 11px; color: var(--text-muted);
+            background: var(--surface);
+            display: flex; justify-content: space-between; align-items: center;
+        }
+    </style>
+</head>
+<body>
+
+<!-- ══════════════════════ SIDEBAR ══════════════════════ -->
+<nav id="sidebar">
+    <div class="sb-brand">
+        <div class="sb-brand-title">Vision Pipeline<br>Research Dashboard</div>
+        <div class="sb-brand-sub">ROS 2 · Object Explorer</div>
+    </div>
+
+    <div class="sb-group">Navigation</div>
+    <div class="sb-link" onclick="window.location.href='index.html'">
+        <div class="sb-dot" style="background:#64748b"></div>
+        ← Main Dashboard
+    </div>
+    <div class="sb-link active">
+        <div class="sb-dot" style="background:var(--color-obj)"></div>
+        Object Explorer
+    </div>
+
+    <div class="sb-group">Filters</div>
+    <div class="sb-link" onclick="setGroupBy('none')">
+        <div class="sb-dot" style="background:#64748b"></div>
+        No Grouping
+    </div>
+    <div class="sb-link" onclick="setGroupBy('label')">
+        <div class="sb-dot" style="background:var(--color-clip)"></div>
+        Group by CLIP Label
+    </div>
+    <div class="sb-link" onclick="setGroupBy('name')">
+        <div class="sb-dot" style="background:var(--color-obj)"></div>
+        Group by Assigned Name
+    </div>
+    <div class="sb-link" onclick="setGroupBy('stable')">
+        <div class="sb-dot" style="background:var(--ok)"></div>
+        Group by Stability
+    </div>
+    <div class="sb-link" onclick="setGroupBy('run')">
+        <div class="sb-dot" style="background:var(--color-sam)"></div>
+        Group by Run #
+    </div>
+
+    <div class="sb-group">Columns</div>
+    <div class="sb-link" onclick="sortByCol('sam_confidence')">
+        <div class="sb-dot" style="background:var(--color-sam)"></div>
+        Sort by SAM Conf
+    </div>
+    <div class="sb-link" onclick="sortByCol('obb_angle_deg')">
+        <div class="sb-dot" style="background:var(--color-obb)"></div>
+        Sort by OBB Angle
+    </div>
+    <div class="sb-link" onclick="sortByCol('distance_cm')">
+        <div class="sb-dot" style="background:var(--color-scene)"></div>
+        Sort by Depth
+    </div>
+    <div class="sb-link" onclick="sortByCol('grasp_quality')">
+        <div class="sb-dot" style="background:var(--color-grasp)"></div>
+        Sort by Grasp Quality
+    </div>
+</nav>
+
+<!-- ══════════════════════ MAIN ══════════════════════════ -->
+<div id="main">
+
+    <!-- Top bar -->
+    <div id="topbar">
+        <div>
+            <div class="tb-title">Object Explorer</div>
+            <div class="tb-sub">Sort · Group · Assign Names · Export  ·  data pulled from <code>vision_runs_history.json</code></div>
+        </div>
+        <div class="tb-right">
+            <span class="ctrl-label">Run</span>
+            <select id="runSelector" style="min-width:190px" onchange="buildAndRender()">
+                <option value="latest">Latest Run</option>
+            </select>
+
+            <div class="ctrl-sep"></div>
+            <span class="ctrl-label">Group</span>
+            <select id="groupBySelect" onchange="applyAndRender()">
+                <option value="none">None</option>
+                <option value="label">CLIP Label</option>
+                <option value="name">Assigned Name</option>
+                <option value="stable">Stability (AP≥0.5)</option>
+                <option value="grasp">Has Grasp</option>
+                <option value="run">Run #</option>
+            </select>
+
+            <div class="ctrl-sep"></div>
+            <input id="searchInput" type="text" placeholder="🔍  Search label, name, ID…"
+                   style="width:195px" oninput="applyAndRender()">
+
+            <div class="ctrl-sep"></div>
+            <button class="btn btn-green" onclick="exportCSV()">↓ CSV</button>
+            <button class="btn btn-primary" onclick="init()">↻ Refresh</button>
+        </div>
+    </div>
+
+    <div class="page-body">
+
+        <!-- Summary strip -->
+        <div class="summary-strip">
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-obj)"></div>
+                <span class="pill-val" id="pv-objects">0</span>
+                <span class="pill-lbl">Objects</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-sam)"></div>
+                <span class="pill-val" id="pv-samconf">—</span>
+                <span class="pill-lbl">Avg SAM Conf</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-clip)"></div>
+                <span class="pill-val" id="pv-labels">0</span>
+                <span class="pill-lbl">Unique Labels</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-grasp)"></div>
+                <span class="pill-val" id="pv-graspable">0</span>
+                <span class="pill-lbl">Graspable</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-obb)"></div>
+                <span class="pill-val" id="pv-obbavg">—</span>
+                <span class="pill-lbl">Avg OBB Angle</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:#22c55e"></div>
+                <span class="pill-val" id="pv-stable">0</span>
+                <span class="pill-lbl">Stable (AP≥0.5)</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-scene)"></div>
+                <span class="pill-val" id="pv-rels">0</span>
+                <span class="pill-lbl">Relations</span>
+            </div>
+            <div class="summary-pill">
+                <div class="pill-dot" style="background:var(--color-obj)"></div>
+                <span class="pill-val" id="pv-named">0</span>
+                <span class="pill-lbl">Named</span>
+            </div>
+        </div>
+
+        <!-- Main table -->
+        <div class="section-card">
+            <div class="table-wrap">
+                <table id="tbl">
+                    <thead>
+                        <!-- ── Column Group Row ── -->
+                        <tr class="cg-row">
+                            <th class="sc1 cg-obj" colspan="3">Object</th>
+                            <th class="cg-sam"   colspan="6">SAM — Segment Anything Model</th>
+                            <th class="cg-clip"  colspan="3">CLIP Classification</th>
+                            <th class="cg-grasp" colspan="3">GraspNet</th>
+                            <th class="cg-obb"   colspan="4">OBB — Oriented BBox</th>
+                            <th class="cg-scene" colspan="2">Scene Understanding</th>
+                        </tr>
+                        <!-- ── Column Header Row ── -->
+                        <tr class="ch-row">
+                            <!-- Object -->
+                            <th class="sc1" data-col="assigned_name" onclick="toggleSort('assigned_name')">
+                                Assigned Name <span class="sort-icon">↕</span>
+                            </th>
+                            <th class="sc2" data-col="object_id" onclick="toggleSort('object_id')">
+                                Obj ID <span class="sort-icon">↕</span>
+                            </th>
+                            <th class="sc3" data-col="run_no" onclick="toggleSort('run_no')">
+                                Run # <span class="sort-icon">↕</span>
+                            </th>
+                            <!-- SAM -->
+                            <th>BBox (x1,y1 → x2,y2)</th>
+                            <th data-col="center_u" onclick="toggleSort('center_u')">
+                                Middle Point <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="distance_cm" onclick="toggleSort('distance_cm')">
+                                z / Depth (cm) <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="sam_confidence" onclick="toggleSort('sam_confidence')">
+                                Confidence <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="iou_score" onclick="toggleSort('iou_score')">
+                                IoU Score <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="is_stable" onclick="toggleSort('is_stable')">
+                                AP (IoU ≥ 0.5) <span class="sort-icon">↕</span>
+                            </th>
+                            <!-- CLIP -->
+                            <th data-col="label" onclick="toggleSort('label')">
+                                Label <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="clip_confidence" onclick="toggleSort('clip_confidence')">
+                                Confidence <span class="sort-icon">↕</span>
+                            </th>
+                            <th>Top-1 Acc</th>
+                            <!-- GraspNet -->
+                            <th data-col="has_grasp" onclick="toggleSort('has_grasp')">
+                                Has Grasp <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="grasp_quality" onclick="toggleSort('grasp_quality')">
+                                Quality (Q) <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="grasp_width" onclick="toggleSort('grasp_width')">
+                                Width (m) <span class="sort-icon">↕</span>
+                            </th>
+                            <!-- OBB -->
+                            <th data-col="obb_angle_deg" onclick="toggleSort('obb_angle_deg')">
+                                Angle from X (°) <span class="sort-icon">↕</span>
+                            </th>
+                            <th data-col="obb_theta_rad" onclick="toggleSort('obb_theta_rad')">
+                                θ (rad) <span class="sort-icon">↕</span>
+                            </th>
+                            <th>W × H (px)</th>
+                            <th>OBB Center</th>
+                            <!-- Scene -->
+                            <th data-col="rel_count" onclick="toggleSort('rel_count')">
+                                Relations <span class="sort-icon">↕</span>
+                            </th>
+                            <th>Relation Detail</th>
+                        </tr>
+                    </thead>
+                    <tbody id="tbl-body">
+                        <tr class="no-data"><td colspan="21">Loading…</td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
+    </div><!-- /page-body -->
+
+    <div class="footer">
+        <span>Object Explorer · Vision Pipeline Research Dashboard · ROS 2</span>
+        <span id="footer-status">—</span>
+    </div>
+</div>
+
+<script>
+// ═══════════════════════════════════════════════════════════════
+//  State
+// ═══════════════════════════════════════════════════════════════
+let allRuns     = [];   // run-history array as returned by /api/run-history (assigned in init)
+let currentRows = [];   // rows for selected run(s)
+let viewRows    = [];   // after filter + sort
+
+let sortCol = null;     // row field currently sorted on; null = keep build order
+let sortDir = 'asc';    // 'asc' or 'desc'
+
+// Names assigned on this page are kept in localStorage under NAMES_KEY, keyed by object_id.
+const NAMES_KEY = 'vision_assigned_names';
+let assignedNames = {};
+// A missing or unparsable stored value leaves the map empty instead of aborting the script.
+try { assignedNames = JSON.parse(localStorage.getItem(NAMES_KEY) || '{}'); } catch(_) {}
+
+function saveName(oid, name) {
+    if (name) assignedNames[oid] = name;
+    else       delete assignedNames[oid];
+    localStorage.setItem(NAMES_KEY, JSON.stringify(assignedNames));
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Fetch
+// ═══════════════════════════════════════════════════════════════
+async function init() {
+    try {
+        const res = await fetch('/api/run-history');
+        allRuns   = await res.json();
+        populateRunSelector();
+        buildAndRender();
+        document.getElementById('footer-status').textContent =
+            `Refreshed ${new Date().toLocaleTimeString()}  ·  ${allRuns.length} run(s) in history`;
+    } catch(e) {
+        showNoData('Cannot connect to /api/run-history — start the benchmark_dashboard node first.');
+        document.getElementById('footer-status').textContent = 'Offline';
+    }
+}
+
+function populateRunSelector() {
+    const sel  = document.getElementById('runSelector');
+    const prev = sel.value;
+    sel.innerHTML = '<option value="latest">Latest Run</option><option value="all">All Runs</option>';
+    allRuns.slice().reverse().forEach(r => {
+        const m  = r.meta || {};
+        const ts = m.timestamp ? new Date(m.timestamp).toLocaleString() : '?';
+        sel.innerHTML += `<option value="${m.run_no}">Run #${m.run_no} — ${ts}</option>`;
+    });
+    try { sel.value = prev; } catch(_) {}
+}
+
+function getSelectedRuns() {
+    const v = document.getElementById('runSelector').value;
+    if (v === 'latest') return allRuns.slice(-1);
+    if (v === 'all')    return allRuns;
+    return allRuns.filter(r => String(r.meta?.run_no) === v);
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Build flat row objects from run history
+// ═══════════════════════════════════════════════════════════════
+function buildRows(runs) {
+    const rows = [];
+    for (const run of runs) {
+        const meta  = run.meta  || {};
+        const scene = run.scene || {};
+
+        // relation lookup: object_id → relation list
+        const relMap = {};
+        for (const rel of (run.relations || [])) {
+            if (!relMap[rel.subject]) relMap[rel.subject] = [];
+            relMap[rel.subject].push(rel);
+        }
+
+        for (const obj of (run.objects || [])) {
+            const oid  = obj.object_id || '';
+            const bx1  = obj.bbox_x1 != null ? +obj.bbox_x1 : null;
+            const by1  = obj.bbox_y1 != null ? +obj.bbox_y1 : null;
+            const bx2  = obj.bbox_x2 != null ? +obj.bbox_x2 : null;
+            const by2  = obj.bbox_y2 != null ? +obj.bbox_y2 : null;
+            const cu   = bx1 != null && bx2 != null ? Math.round((bx1+bx2)/2) : null;
+            const cv   = by1 != null && by2 != null ? Math.round((by1+by2)/2) : null;
+            const gq   = obj.grasp?.quality_score != null ? +obj.grasp.quality_score : null;
+            const gw   = obj.grasp?.width_m       != null ? +obj.grasp.width_m       : null;
+            const rels = relMap[oid] || [];
+
+            const toNum = v => (v !== '' && v != null) ? +v : null;
+
+            rows.push({
+                /* ─ Object ─ */
+                assigned_name:   assignedNames[oid] || '',
+                object_id:       oid,
+                run_no:          meta.run_no ?? '?',
+                timestamp:       meta.timestamp || '',
+                /* ─ SAM ─ */
+                bbox_x1:         bx1,  bbox_y1: by1,
+                bbox_x2:         bx2,  bbox_y2: by2,
+                center_u:        cu,   center_v: cv,
+                distance_cm:     obj.distance_cm    != null ? +obj.distance_cm    : null,
+                sam_confidence:  obj.sam_confidence != null ? +obj.sam_confidence : null,
+                iou_score:       obj.iou_score      != null ? +obj.iou_score      : null,
+                is_stable:       obj.is_stable ?? null,
+                /* ─ CLIP ─ */
+                label:           obj.label || '',
+                clip_confidence: obj.clip_confidence != null ? +obj.clip_confidence : null,
+                /* ─ GraspNet ─ */
+                has_grasp:       obj.has_grasp ?? false,
+                grasp_quality:   gq,
+                grasp_width:     gw,
+                /* ─ OBB ─ */
+                obb_angle_deg:   toNum(obj.obb_angle_deg),
+                obb_theta_rad:   toNum(obj.obb_theta_rad),
+                obb_width_px:    toNum(obj.obb_width_px),
+                obb_height_px:   toNum(obj.obb_height_px),
+                obb_center_u:    toNum(obj.obb_center_u),
+                obb_center_v:    toNum(obj.obb_center_v),
+                /* ─ Scene ─ */
+                relations:       rels,
+                rel_count:       rels.length,
+                scene_desc:      scene.scene_description || '',
+            });
+        }
+    }
+    return rows;
+}
+
+function buildAndRender() {
+    currentRows = buildRows(getSelectedRuns());
+    applyAndRender();
+}
+
+function applyAndRender() {
+    const q = (document.getElementById('searchInput').value || '').toLowerCase().trim();
+
+    viewRows = q
+        ? currentRows.filter(r =>
+            (r.assigned_name || '').toLowerCase().includes(q) ||
+            (r.label         || '').toLowerCase().includes(q) ||
+            (r.object_id     || '').toLowerCase().includes(q)
+          )
+        : [...currentRows];
+
+    // Sort
+    if (sortCol) {
+        viewRows.sort((a, b) => {
+            let av = a[sortCol], bv = b[sortCol];
+            if (av == null && bv == null) return 0;
+            if (av == null) return 1;
+            if (bv == null) return -1;
+            if (typeof av === 'boolean') av = av ? 1 : 0;
+            if (typeof bv === 'boolean') bv = bv ? 1 : 0;
+            return av < bv ? (sortDir==='asc'?-1:1) : av > bv ? (sortDir==='asc'?1:-1) : 0;
+        });
+    }
+
+    renderTable();
+    updateSummary();
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Render
+// ═══════════════════════════════════════════════════════════════
+function renderTable() {
+    const tbody = document.getElementById('tbl-body');
+    if (!viewRows.length) {
+        tbody.innerHTML = '<tr class="no-data"><td colspan="21">No objects match — try changing the run or clearing the search.</td></tr>';
+        return;
+    }
+
+    const groupBy = document.getElementById('groupBySelect').value;
+
+    if (groupBy === 'none') {
+        tbody.innerHTML = viewRows.map(renderRow).join('');
+        return;
+    }
+
+    const keyFn = {
+        label:  r => r.label           || '(no label)',
+        name:   r => r.assigned_name   || '(unassigned)',
+        stable: r => r.is_stable ? '✓ Stable  (AP ≥ 0.5)' : '✗ Unstable',
+        grasp:  r => r.has_grasp ? '✓ Graspable' : '✗ Not graspable',
+        run:    r => `Run #${r.run_no}`,
+    }[groupBy] || (() => 'All');
+
+    const groups = new Map();
+    for (const r of viewRows) {
+        const k = keyFn(r);
+        if (!groups.has(k)) groups.set(k, []);
+        groups.get(k).push(r);
+    }
+
+    let html = '';
+    for (const [key, gRows] of [...groups.entries()].sort(([a],[b]) => a < b ? -1 : a > b ? 1 : 0)) {
+        const graspN  = gRows.filter(r => r.has_grasp).length;
+        const confN   = gRows.filter(r => r.sam_confidence != null);
+        const avgConf = confN.length
+            ? (confN.reduce((s,r) => s + r.sam_confidence, 0) / confN.length).toFixed(3)
+            : null;
+        html += `<tr class="group-row">
+            <td colspan="21">
+                <span class="group-label">${esc(key)}</span>
+                <span class="chip ck-na">${gRows.length} obj</span>
+                ${avgConf != null ? `<span class="chip ck-na">Avg SAM ${avgConf}</span>` : ''}
+                ${graspN ? `<span class="chip ck-ok">${graspN} graspable</span>` : ''}
+            </td>
+        </tr>`;
+        html += gRows.map(renderRow).join('');
+    }
+    tbody.innerHTML = html;
+}
+
+function renderRow(r) {
+    const oid  = r.object_id;
+    const sid  = escId(oid);
+    const name = r.assigned_name || '';
+
+    // BBox string
+    const bboxStr = r.bbox_x1 != null
+        ? `(${Math.round(r.bbox_x1)},${Math.round(r.bbox_y1)})→(${Math.round(r.bbox_x2)},${Math.round(r.bbox_y2)})`
+        : null;
+
+    // Center (middle point)
+    const centerStr = r.center_u != null ? `(${r.center_u}, ${r.center_v})` : null;
+
+    return `<tr>
+        <!-- Object: Assigned Name -->
+        <td class="sc1">
+            <div class="name-cell" id="nc-${sid}">
+                <span class="name-val ${name?'':'empty'}" title="${esc(name||'Click ✏ to assign')}">${esc(name||'Assign name…')}</span>
+                <button class="edit-btn" onclick="startEdit(${JSON.stringify(oid)})" title="Edit name">✏</button>
+            </div>
+        </td>
+        <!-- Obj ID -->
+        <td class="sc2 mono" style="font-size:11px;color:var(--text-secondary)">${esc(oid)}</td>
+        <!-- Run # -->
+        <td class="sc3"><span class="chip ck-run">#${r.run_no}</span></td>
+
+        <!-- SAM: BBox -->
+        <td class="mono" style="font-size:11px">${bboxStr ?? '<span class="dim">—</span>'}</td>
+        <!-- SAM: Middle Point (center) -->
+        <td class="mono">${centerStr ?? '<span class="dim">—</span>'}</td>
+        <!-- SAM: z / Depth -->
+        <td class="mono">${r.distance_cm != null ? r.distance_cm.toFixed(1) : '<span class="dim">—</span>'}</td>
+        <!-- SAM: Confidence -->
+        <td>${confBar(r.sam_confidence)}</td>
+        <!-- SAM: IoU -->
+        <td>${confBar(r.iou_score)}</td>
+        <!-- SAM: AP (IoU>=0.5) -->
+        <td>${r.is_stable === null || r.is_stable === undefined
+                ? '<span class="chip ck-na">—</span>'
+                : r.is_stable
+                    ? '<span class="chip ck-ok">✓ Pass</span>'
+                    : '<span class="chip ck-fail">✗ Fail</span>'}</td>
+
+        <!-- CLIP: Label -->
+        <td>${r.label ? `<span class="chip ck-label">${esc(r.label)}</span>` : '<span class="dim">—</span>'}</td>
+        <!-- CLIP: Confidence -->
+        <td>${confBar(r.clip_confidence)}</td>
+        <!-- CLIP: Top-1 Acc -->
+        <td><span class="chip ck-na" title="Not stored in run history — requires benchmark_dashboard">N/A</span></td>
+
+        <!-- GraspNet: Has Grasp -->
+        <td>${r.has_grasp
+            ? '<span class="chip ck-ok">✓ Yes</span>'
+            : '<span class="chip ck-fail">✗ No</span>'}</td>
+        <!-- GraspNet: Quality -->
+        <td>${confBar(r.grasp_quality)}</td>
+        <!-- GraspNet: Width -->
+        <td class="mono">${r.grasp_width != null ? r.grasp_width.toFixed(3) + ' m' : '<span class="dim">—</span>'}</td>
+
+        <!-- OBB: Angle from X-axis -->
+        <td>${angleBar(r.obb_angle_deg)}</td>
+        <!-- OBB: θ rad -->
+        <td class="mono">${r.obb_theta_rad != null ? r.obb_theta_rad.toFixed(4) : '<span class="dim">—</span>'}</td>
+        <!-- OBB: W × H -->
+        <td class="mono">${r.obb_width_px != null
+            ? `${Math.round(r.obb_width_px)} × ${Math.round(r.obb_height_px)}`
+            : '<span class="dim">—</span>'}</td>
+        <!-- OBB: Center -->
+        <td class="mono">${r.obb_center_u != null
+            ? `(${Math.round(r.obb_center_u)}, ${Math.round(r.obb_center_v)})`
+            : '<span class="dim">—</span>'}</td>
+
+        <!-- Scene: Relation count -->
+        <td>${r.rel_count > 0
+            ? `<span class="chip ck-rel">${r.rel_count}</span>`
+            : '<span class="dim">—</span>'}</td>
+        <!-- Scene: Relation detail -->
+        <td>
+            <div class="rel-cell">
+                ${r.relations.slice(0, 3).map(rx =>
+                    `<span class="chip ck-rel" title="${esc(rx.description||'')}">${esc(rx.relation||'')} ${esc(rx.target_object||'')} <span style="opacity:.6">${rx.confidence!=null?(+rx.confidence*100).toFixed(0)+'%':''}</span></span>`
+                ).join('')}
+                ${r.relations.length > 3
+                    ? `<span class="chip ck-na" title="Click to expand (future)">+${r.relations.length-3} more</span>`
+                    : ''}
+            </div>
+        </td>
+    </tr>`;
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Visual helpers
+// ═══════════════════════════════════════════════════════════════
+function confBar(v) {
+    if (v == null) return '<span class="dim">—</span>';
+    const n   = parseFloat(v);
+    if (isNaN(n)) return '<span class="dim">—</span>';
+    const cls = n >= 0.7 ? 'h' : n >= 0.4 ? 'm' : 'l';
+    const pct = Math.min(100, Math.round(n * 100));
+    return `<div class="conf-bar">
+        <div class="conf-track"><div class="conf-fill cf-${cls}" style="width:${pct}%"></div></div>
+        <span class="conf-num cn-${cls}">${n.toFixed(2)}</span>
+    </div>`;
+}
+
+function angleBar(deg) {
+    if (deg == null) return '<span class="dim">—</span>';
+    const n = parseFloat(deg);
+    if (isNaN(n)) return '<span class="dim">—</span>';
+    // range -90 to +90, bar centred at 0
+    const clr   = Math.abs(n) < 20 ? 'var(--ok)' : Math.abs(n) < 60 ? 'var(--warn)' : 'var(--fail)';
+    const half  = 50; // 50% = center
+    const pct   = Math.abs(n) / 90 * half; // 0→50
+    const style = n >= 0
+        ? `left:${half}%;width:${pct}%;background:${clr}`
+        : `right:${half}%;width:${pct}%;left:${half - pct}%;background:${clr}`;
+    return `<div class="ang-bar">
+        <div class="ang-track">
+            <div class="ang-mid"></div>
+            <div class="ang-fill" style="${style}"></div>
+        </div>
+        <span class="conf-num" style="color:${clr};min-width:42px">${n.toFixed(1)}°</span>
+    </div>`;
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Sort
+// ═══════════════════════════════════════════════════════════════
+function toggleSort(col) {
+    if (sortCol === col) sortDir = sortDir === 'asc' ? 'desc' : 'asc';
+    else { sortCol = col; sortDir = 'asc'; }
+    refreshSortIcons();
+    applyAndRender();
+}
+function sortByCol(col) {
+    sortCol = col; sortDir = 'asc';
+    refreshSortIcons();
+    applyAndRender();
+}
+function refreshSortIcons() {
+    document.querySelectorAll('.ch-row th').forEach(th => {
+        th.classList.remove('sort-asc','sort-desc');
+        const ic = th.querySelector('.sort-icon');
+        if (ic) ic.textContent = '↕';
+    });
+    const active = document.querySelector(`.ch-row th[data-col="${sortCol}"]`);
+    if (active) {
+        active.classList.add(sortDir === 'asc' ? 'sort-asc' : 'sort-desc');
+        const ic = active.querySelector('.sort-icon');
+        if (ic) ic.textContent = sortDir === 'asc' ? '↑' : '↓';
+    }
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Inline name editing
+// ═══════════════════════════════════════════════════════════════
+function startEdit(oid) {
+    const cellDiv = document.getElementById('nc-' + escId(oid));
+    if (!cellDiv) return;
+    const cur = assignedNames[oid] || '';
+    cellDiv.innerHTML = `<input class="name-input" id="ni-${escId(oid)}"
+        type="text" value="${esc(cur)}" placeholder="Object name…"
+        maxlength="50" autocomplete="off">`;
+    const inp = document.getElementById('ni-' + escId(oid));
+    if (!inp) return;
+    inp.focus(); inp.select();
+    inp.addEventListener('blur',    () => commitEdit(oid, inp.value));
+    inp.addEventListener('keydown', e => {
+        if (e.key === 'Enter')  inp.blur();
+        if (e.key === 'Escape') { inp.value = cur; inp.blur(); }
+    });
+}
+
+function commitEdit(oid, rawName) {
+    const name = (rawName || '').trim();
+    saveName(oid, name);
+    // Update in-memory rows
+    [currentRows, viewRows].forEach(arr => {
+        arr.forEach(r => { if (r.object_id === oid) r.assigned_name = name; });
+    });
+    // Re-render that cell only
+    const cellDiv = document.getElementById('nc-' + escId(oid));
+    if (cellDiv) {
+        cellDiv.innerHTML = `
+            <span class="name-val ${name?'':'empty'}" title="${esc(name||'Click ✏ to assign')}">${esc(name||'Assign name…')}</span>
+            <button class="edit-btn" onclick="startEdit(${JSON.stringify(oid)})" title="Edit name">✏</button>`;
+    }
+    updateSummary();
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Summary pills
+// ═══════════════════════════════════════════════════════════════
+function updateSummary() {
+    const n = viewRows.length;
+    document.getElementById('pv-objects').textContent = n;
+
+    const cRows = viewRows.filter(r => r.sam_confidence != null);
+    document.getElementById('pv-samconf').textContent =
+        cRows.length ? (cRows.reduce((s,r) => s+r.sam_confidence, 0) / cRows.length).toFixed(3) : '—';
+
+    document.getElementById('pv-labels').textContent =
+        new Set(viewRows.filter(r=>r.label).map(r=>r.label)).size;
+
+    document.getElementById('pv-graspable').textContent =
+        viewRows.filter(r => r.has_grasp).length;
+
+    const oRows = viewRows.filter(r => r.obb_angle_deg != null);
+    document.getElementById('pv-obbavg').textContent =
+        oRows.length ? (oRows.reduce((s,r)=>s+r.obb_angle_deg,0)/oRows.length).toFixed(1)+'°' : '—';
+
+    document.getElementById('pv-stable').textContent =
+        viewRows.filter(r => r.is_stable === true).length;
+
+    document.getElementById('pv-rels').textContent =
+        viewRows.reduce((s,r) => s + r.rel_count, 0);
+
+    document.getElementById('pv-named').textContent =
+        viewRows.filter(r => r.assigned_name).length;
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Group-by helper (called from sidebar links)
+// ═══════════════════════════════════════════════════════════════
+function setGroupBy(val) {
+    document.getElementById('groupBySelect').value = val;
+    applyAndRender();
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Export CSV
+// ═══════════════════════════════════════════════════════════════
+function exportCSV() {
+    const hdr = [
+        'Assigned Name','Object ID','Run #','Timestamp',
+        'BBox X1','BBox Y1','BBox X2','BBox Y2',
+        'Center U (px)','Center V (px)',
+        'Depth / z (cm)',
+        'SAM Confidence','IoU Score','AP (IoU>=0.5)',
+        'CLIP Label','CLIP Confidence',
+        'Has Grasp','Grasp Quality','Grasp Width (m)',
+        'OBB Angle from X (deg)','OBB Theta (rad)',
+        'OBB Width (px)','OBB Height (px)',
+        'OBB Center U','OBB Center V',
+        'Relations Count','Relation List'
+    ];
+    const data = viewRows.map(r => [
+        r.assigned_name,       r.object_id,         r.run_no,            r.timestamp,
+        r.bbox_x1  ?? '',      r.bbox_y1  ?? '',     r.bbox_x2  ?? '',    r.bbox_y2  ?? '',
+        r.center_u ?? '',      r.center_v ?? '',
+        r.distance_cm ?? '',
+        r.sam_confidence ?? '', r.iou_score ?? '',
+        r.is_stable == null ? '' : r.is_stable,
+        r.label,               r.clip_confidence ?? '',
+        r.has_grasp,           r.grasp_quality ?? '', r.grasp_width ?? '',
+        r.obb_angle_deg ?? '',  r.obb_theta_rad ?? '',
+        r.obb_width_px  ?? '',  r.obb_height_px ?? '',
+        r.obb_center_u  ?? '',  r.obb_center_v  ?? '',
+        r.rel_count,
+        r.relations.map(x => `${x.subject} ${x.relation} ${x.target_object}`).join(' | ')
+    ].map(v => `"${String(v ?? '').replace(/"/g,'""')}"`));
+
+    const csv  = [hdr.map(h=>`"${h}"`).join(','), ...data.map(d=>d.join(','))].join('\n');
+    const blob = new Blob(['\uFEFF'+csv], {type:'text/csv;charset=utf-8;'});
+    const url  = URL.createObjectURL(blob);
+    const a    = Object.assign(document.createElement('a'), {
+        href:     url,
+        download: `vision_objects_${new Date().toISOString().slice(0,19).replace(/[T:]/g,'_')}.csv`
+    });
+    a.click();
+    URL.revokeObjectURL(url);
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Utilities
+// ═══════════════════════════════════════════════════════════════
+function esc(s) {
+    return String(s ?? '').replace(/&/g,'&amp;').replace(/</g,'&lt;').replace(/>/g,'&gt;').replace(/"/g,'&quot;');
+}
+function escId(s) {
+    return String(s ?? '').replace(/[^a-zA-Z0-9_-]/g, '_');
+}
+function showNoData(msg) {
+    document.getElementById('tbl-body').innerHTML =
+        `<tr class="no-data"><td colspan="21">${esc(msg)}</td></tr>`;
+}
+
+// ═══════════════════════════════════════════════════════════════
+//  Bootstrap
+// ═══════════════════════════════════════════════════════════════
+init();                     // initial load when the script runs
+setInterval(init, 5000);    // then call init again every 5000 ms
+</script>
+</body>
+</html>
diff --git a/vision_scripts/collect_and_export.py b/vision_scripts/collect_and_export.py
index b61ae99..35ae942 100644
--- a/vision_scripts/collect_and_export.py
+++ b/vision_scripts/collect_and_export.py
@@ -26,6 +26,7 @@
     ros2 run vision collect_and_export
 """
 
+import math
 import rclpy
 from rclpy.node import Node
 from std_srvs.srv import Trigger
@@ -36,6 +37,13 @@
 from datetime import datetime
 from pathlib import Path
 
+# OBB service uses custom_interfaces (optional — graceful skip if not built)
+try:
+    from custom_interfaces.srv import FindObjectAngle
+    _OBB_AVAILABLE = True
+except ImportError:
+    _OBB_AVAILABLE = False
+
 # ---------------------------------------------------------------------------
 # Output file paths  (workspace root = parent of this script's package dir)
 # ---------------------------------------------------------------------------
@@ -121,7 +129,9 @@ def _write_sheet(ws, headers, rows, colour_col=None):
         "Run No", "Timestamp", "SAM Total Objects", "CLIP Filtered Regions",
         "Graspable Objects", "Total Relations", "Avg SAM Confidence",
         "Avg IoU", "Stability Rate (%)", "Scene Description",
-        "SAM Success", "CLIP Success", "Scene Success", "Latency (s)"
+        "SAM Success", "CLIP Success", "Scene Success", "OBB Success",
+        "Total Latency (s)", "SAM Latency (s)", "CLIP Latency (s)",
+        "Scene Latency (s)", "OBB Latency (s)"
     ]
     runs_rows = []
     for run in runs:
@@ -129,6 +139,7 @@ def _write_sheet(ws, headers, rows, colour_col=None):
         sam  = run.get("sam", {})
         clip = run.get("clip", {})
         scene = run.get("scene", {})
+        obb   = run.get("obb", {})
         runs_rows.append([
             meta.get("run_no", ""),
             meta.get("timestamp", ""),
@@ -143,7 +154,12 @@ def _write_sheet(ws, headers, rows, colour_col=None):
             sam.get("success", ""),
             clip.get("success", ""),
             scene.get("success", ""),
+            obb.get("success", ""),
             meta.get("latency_s", ""),
+            sam.get("latency_s", ""),
+            clip.get("latency_s", ""),
+            scene.get("latency_s", ""),
+            obb.get("latency_s", ""),
         ])
     _write_sheet(ws_runs, runs_headers, runs_rows)
 
@@ -154,7 +170,11 @@ def _write_sheet(ws, headers, rows, colour_col=None):
         "BBox X1", "BBox Y1", "BBox X2", "BBox Y2",
         "SAM Confidence", "CLIP Confidence",
         "Distance (cm)", "IoU Score", "Is Stable",
-        "Has Grasp", "Grasp Quality", "Grasp Width (m)"
+        "Has Grasp", "Grasp Quality", "Grasp Width (m)",
+        # OBB columns
+        "OBB Angle (deg)", "OBB Theta (rad)",
+        "OBB Width (px)", "OBB Height (px)",
+        "OBB Center U", "OBB Center V",
     ]
     obj_rows = []
     for run in runs:
@@ -177,6 +197,13 @@ def _write_sheet(ws, headers, rows, colour_col=None):
                 obj.get("has_grasp", ""),
                 grasp.get("quality_score", ""),
                 grasp.get("width_m", ""),
+                # OBB
+                obj.get("obb_angle_deg", ""),
+                obj.get("obb_theta_rad", ""),
+                obj.get("obb_width_px",  ""),
+                obj.get("obb_height_px", ""),
+                obj.get("obb_center_u",  ""),
+                obj.get("obb_center_v",  ""),
             ])
     _write_sheet(ws_obj, obj_headers, obj_rows)
 
@@ -232,6 +259,45 @@ def _write_sheet(ws, headers, rows, colour_col=None):
             ])
     _write_sheet(ws_grasp, grasp_headers, grasp_rows)
 
+    # ---- Sheet 5: OBB Angles ----
+    ws_obb = wb.create_sheet("OBB Angles")
+    obb_headers = [
+        "Run No", "Timestamp",
+        "Object ID", "CLIP Label",
+        "OBB Angle (deg)", "OBB Theta (rad)",
+        "OBB Width (px)", "OBB Height (px)",
+        "OBB Center U", "OBB Center V",
+        "BBox X1", "BBox Y1", "BBox X2", "BBox Y2",
+        "SAM Confidence", "Distance (cm)",
+        "OBB Latency (s)",
+    ]
+    obb_rows = []
+    for run in runs:
+        meta   = run.get("meta", {})
+        run_no = meta.get("run_no", "")
+        ts     = meta.get("timestamp", "")
+        obb_lat = run.get("obb", {}).get("latency_s", "")
+        for obj in run.get("objects", []):
+            if obj.get("obb_angle_deg", "") == "":
+                continue  # skip objects where OBB wasn't available
+            obb_rows.append([
+                run_no, ts,
+                obj.get("object_id", ""),
+                obj.get("label", ""),
+                obj.get("obb_angle_deg", ""),
+                obj.get("obb_theta_rad", ""),
+                obj.get("obb_width_px",  ""),
+                obj.get("obb_height_px", ""),
+                obj.get("obb_center_u",  ""),
+                obj.get("obb_center_v",  ""),
+                obj.get("bbox_x1", ""), obj.get("bbox_y1", ""),
+                obj.get("bbox_x2", ""), obj.get("bbox_y2", ""),
+                obj.get("sam_confidence", ""),
+                obj.get("distance_cm", ""),
+                obb_lat,
+            ])
+    _write_sheet(ws_obb, obb_headers, obb_rows)
+
     wb.save(str(EXCEL_FILE))
     print(f"[OK] Excel exported → {EXCEL_FILE}")
 
@@ -249,6 +315,13 @@ def __init__(self):
         self._clip_client  = self.create_client(Trigger, "/vision/classify_bbox_filtered")
         self._scene_client = self.create_client(Trigger, "/vision/understand_scene")
 
+        # OBB client — only if custom_interfaces is built
+        if _OBB_AVAILABLE:
+            self._obb_client = self.create_client(FindObjectAngle, "/obb/find_object_angle")
+        else:
+            self._obb_client = None
+            self.get_logger().warn("custom_interfaces not found — OBB step will be skipped")
+
     # ------------------------------------------------------------------
     # Low-level call helper
     # ------------------------------------------------------------------
@@ -273,6 +346,24 @@ def _call(self, client, service_name, timeout=10.0):
             return False, None
         return result.success, result.message
 
+    def _call_obb(self, timeout=10.0):
+        """Call /obb/find_object_angle; return its response, or None when skipped, unavailable or timed out."""
+        if self._obb_client is None:
+            return None  # the client is only created when custom_interfaces imported successfully
+        service_name = "/obb/find_object_angle"
+        self.get_logger().info(f"Waiting for {service_name} ...")
+        if not self._obb_client.wait_for_service(timeout_sec=5.0):
+            self.get_logger().warn(f"{service_name} not available — skipping OBB step")
+            return None
+        future = self._obb_client.call_async(FindObjectAngle.Request())
+        start = time.monotonic()  # monotonic clock: the timeout cannot be skewed by wall-clock adjustments
+        while not future.done():
+            rclpy.spin_once(self, timeout_sec=0.05)  # keep processing callbacks so the response can be delivered
+            if time.monotonic() - start > timeout:
+                self.get_logger().error(f"{service_name} call timed out")
+                return None
+        return future.result()
+
     # ------------------------------------------------------------------
     # Collect one run
     # ------------------------------------------------------------------
@@ -284,9 +375,10 @@ def collect_run(self, run_no):
 
         run = {
             "meta": {"run_no": run_no, "timestamp": ts},
-            "sam":  {"success": False},
-            "clip": {"success": False},
-            "scene": {"success": False},
+            "sam":  {"success": False, "latency_s": 0.0},
+            "clip": {"success": False, "latency_s": 0.0},
+            "scene": {"success": False, "latency_s": 0.0},
+            "obb":  {"success": False, "total_objects": 0, "latency_s": 0.0},
             "objects":   [],
             "relations": [],
             "grasps":    [],
@@ -295,7 +387,9 @@ def collect_run(self, run_no):
         # ---- 1. SAM ----
         self.get_logger().info("=" * 60)
         self.get_logger().info(f"RUN #{run_no} — Step 1: SAM /vision/run_pipeline")
+        t_sam = time.perf_counter()
         sam_ok, sam_msg = self._call(self._sam_client, "/vision/run_pipeline")
+        run["sam"]["latency_s"] = round(time.perf_counter() - t_sam, 3)
         if sam_ok and sam_msg:
             try:
                 sam_data = json.loads(sam_msg)
@@ -306,6 +400,7 @@ def collect_run(self, run_no):
 
                 run["sam"] = {
                     "success":       True,
+                    "latency_s":     run["sam"]["latency_s"],
                     "total_detections": summary.get("total_detections", 0),
                     "avg_confidence":   circ.get("average_confidence", 0.0),
                     "average_iou":      coco.get("average_iou", 0.0),
@@ -340,12 +435,15 @@ def collect_run(self, run_no):
 
         # ---- 2. CLIP ----
         self.get_logger().info(f"RUN #{run_no} — Step 2: CLIP /vision/classify_bbox_filtered")
+        t_clip = time.perf_counter()
         clip_ok, clip_msg = self._call(self._clip_client, "/vision/classify_bbox_filtered")
+        run["clip"]["latency_s"] = round(time.perf_counter() - t_clip, 3)
         if clip_ok and clip_msg:
             try:
                 clip_data = json.loads(clip_msg)
                 run["clip"] = {
                     "success":          True,
+                    "latency_s":        run["clip"]["latency_s"],
                     "total_sam_regions": clip_data.get("total_sam_regions", 0),
                     "filtered_regions":  clip_data.get("filtered_regions", 0),
                 }
@@ -362,12 +460,15 @@ def collect_run(self, run_no):
 
         # ---- 3. Scene Understanding ----
         self.get_logger().info(f"RUN #{run_no} — Step 3: Scene /vision/understand_scene")
+        t_scene = time.perf_counter()
         scene_ok, scene_msg = self._call(self._scene_client, "/vision/understand_scene", timeout=15.0)
+        run["scene"]["latency_s"] = round(time.perf_counter() - t_scene, 3)
         if scene_ok and scene_msg:
             try:
                 scene_data = json.loads(scene_msg)
                 run["scene"] = {
                     "success":           True,
+                    "latency_s":         run["scene"]["latency_s"],
                     "scene_id":          scene_data.get("scene_id", ""),
                     "total_objects":     scene_data.get("total_objects", 0),
                     "total_relations":   scene_data.get("total_relations", 0),
@@ -436,6 +537,57 @@ def collect_run(self, run_no):
             except Exception as e:
                 self.get_logger().error(f"  Scene parse error: {e}")
 
+        # ---- 4. OBB Angle Benchmark ----
+        self.get_logger().info(f"RUN #{run_no} — Step 4: OBB /obb/find_object_angle")
+        t_obb = time.perf_counter()
+        obb_resp = self._call_obb()
+        run["obb"]["latency_s"] = round(time.perf_counter() - t_obb, 3)
+
+        if obb_resp is not None and obb_resp.success:
+            run["obb"]["success"]       = True
+            run["obb"]["total_objects"] = obb_resp.total_objects
+
+            # Build a lookup: object_id -> OBB data
+            obb_by_id = {}
+            for i, oid in enumerate(obb_resp.object_ids):
+                theta_rad  = obb_resp.thetas[i]
+                # The service already stores the remapped angle (90 - geom_deg).
+                # angle_deg is directly the display angle (0° = vertical).
+                angle_deg  = math.degrees(theta_rad)
+                obb_by_id[oid] = {
+                    "obb_center_u":  obb_resp.centers_u[i],
+                    "obb_center_v":  obb_resp.centers_v[i],
+                    "obb_theta_rad": round(theta_rad, 5),
+                    "obb_angle_deg": round(angle_deg, 2),
+                    "obb_width_px":  round(obb_resp.widths[i], 2),
+                    "obb_height_px": round(obb_resp.heights[i], 2),
+                }
+
+            # Merge into existing objects list (match by object_id)
+            for obj in run["objects"]:
+                obb = obb_by_id.get(obj.get("object_id", ""))
+                if obb:
+                    obj.update(obb)
+                else:
+                    # Initialise missing OBB fields so Excel has consistent columns
+                    obj.setdefault("obb_center_u",  "")
+                    obj.setdefault("obb_center_v",  "")
+                    obj.setdefault("obb_theta_rad", "")
+                    obj.setdefault("obb_angle_deg", "")
+                    obj.setdefault("obb_width_px",  "")
+                    obj.setdefault("obb_height_px", "")
+
+            self.get_logger().info(
+                f"  OBB: {obb_resp.total_objects} objects, "
+                f"latency={run['obb']['latency_s']}s"
+            )
+        else:
+            # Ensure OBB keys exist even if service was unavailable
+            for obj in run["objects"]:
+                for k in ("obb_center_u","obb_center_v","obb_theta_rad","obb_angle_deg","obb_width_px","obb_height_px"):
+                    obj.setdefault(k, "")
+            self.get_logger().warn("  OBB: service unavailable or returned failure")
+
         # ---- Finalize ----
         run["meta"]["latency_s"] = round(time.perf_counter() - t0, 3)
         self.get_logger().info(

From 7a79158402dc36a4147e5ff39e239a5d42c78c5c Mon Sep 17 00:00:00 2001
From: Methasit-Pun <methasitpun@gmail.com>
Date: Sun, 5 Apr 2026 13:17:33 +0700
Subject: [PATCH 08/16] feat: improve intrinsic and empirical logic method

---
 vision/pixel_to_real.py | 244 +++++++++++++++++++++++-----------------
 1 file changed, 143 insertions(+), 101 deletions(-)

diff --git a/vision/pixel_to_real.py b/vision/pixel_to_real.py
index 1003e1c..43d678a 100644
--- a/vision/pixel_to_real.py
+++ b/vision/pixel_to_real.py
@@ -12,18 +12,27 @@
     float64 y   # world Y coordinate (m, positive forward/away from camera) - with -0.722m offset applied
     float64 z   # world Z coordinate (m, height above table/ground)
 
-Calibration Data:
-  - Origin (0, 0, 0.8) in world: pixel (320, 500) - bottom center of image
-  - Green box at world (0.5, 0, 0.8): pixel (320, 240)
-  - Gear part at world (0.83, 0.03, 0.8): pixel (305, 95)
-  - Drill at world (0.571546, -0.240961, 0.831898): pixel (466, 160.5)
-  - Monkey wrench at world (0.623673, 0.372909, 0.806652): pixel (150, 200)
-  - Table depth: 0.8 m from camera
-  - Coordinate mapping:
-    * u increases right → y DECREASES (u represents -y direction)
-    * v increases down → x DECREASES (v represents -x direction)
-    * x in world increases upward in image (opposite of v)
-    * y in world increases leftward in image (opposite of u)
+Calibration Method (iLogic Hybrid):
+  Linear model fitted from 22 empirical measurements (least-squares, LOO-CV RMSE ≈ 2.0 cm):
+    x =  0.00130317·u + 0.00002114·v − 0.56859693
+    y = −0.00002728·u − 0.00133088·v + 0.98011251
+
+  A Gaussian-IDW empirical correction is added on top:
+    - Problem Zone (near any of the 22 samples): correction applied → RMSE ≈ 1.5 cm
+    - Golden Zone  (far from all samples):       pure linear model used → avoids overfitting
+
+  Empirical samples (u, v → world x, y):
+    (560,362)→(0.165,0.463)  (468,452)→(0.064,0.367)
+    (334,336)→(-0.135,0.495) (241,432)→(-0.245,0.405)
+    (598,245)→(0.205,0.618)  (493,342)→(0.104,0.520)
+    (304,327)→(-0.183,0.510) (206,423)→(-0.295,0.418)
+    (587,113)→(0.195,0.810)  (490,202)→(0.090,0.715)
+    (273,111)→(-0.220,0.800) (177,206)→(-0.325,0.705)
+    (308,302)→(-0.164,0.572) (276,324)→(-0.200,0.533)
+    (555,298)→(0.145,0.576)  (456,384)→(0.040,0.482)
+    (343,284)→(-0.138,0.580) (247,375)→(-0.240,0.485)
+    (562, 85)→(0.166,0.860)  (468,173)→(0.065,0.770)
+    (202, 98)→(-0.310,0.835) (101,196)→(-0.415,0.740)
 
 Setup:
   1. Build the custom_interfaces package:
@@ -157,55 +166,55 @@ def __init__(self,
         # Publisher for debug visualization
         self.debug_pub = self.create_publisher(Image, '/pixel_to_real/debug_image', 10)
 
-        # Calibration data: pixel coordinates (u, v) -> world coordinates (x, y, z)
-        # Using calibration points:
-        # Origin: (u=320, v=500) -> (x=0, y=0, z=0.8)
-        # Green box: (u=320, v=240) -> (x=0.5, y=0, z=0.8)
-        # Gear: (u=305, v=95) -> (x=0.83, y=0.03, z=0.8)
-        
-        # Coordinate system mapping:
-        # u increases right -> y DECREASES (u represents -y direction)
-        # v increases down -> x DECREASES (v represents -x direction)
-        
-        self.u_origin = 320  # u=320 corresponds to y=0
-        self.v_origin = 500  # v=500 corresponds to x=0
-        
-        # Calculate scaling factors from calibration points:
-        # Green box: du=0, dv=-260 pixels -> dx=0.5, dy=0 meters
-        # Gear: du=-15, dv=-405 pixels -> dx=0.83, dy=0.03 meters
-        
-        # From green box (vertical movement in image):
-        # dv = 240 - 500 = -260 pixels (up in image)
-        # dx = 0.5 - 0 = 0.5 meters (positive x, which is up)
-        # scale_x = 0.5 / 260 = 0.00192 m/pixel
-        
-        # From gear (horizontal AND vertical movement):
-        # du = 305 - 320 = -15 pixels (left in image)
-        # dy = 0.03 - 0 = 0.03 meters (positive y, which is left)
-        # scale_y = 0.03 / 15 = 0.002 m/pixel
-        
-        dv_green = 240 - 500  # -260 pixels (up in image)
-        dx_green = 0.5 - 0     # 0.5 meters (positive x in world)
-        
-        du_gear = 305 - 320   # -15 pixels (left in image)
-        dy_gear = 0.03 - 0    # 0.03 meters (positive y in world)
-        
-        self.scale_x = abs(dx_green / dv_green)  # 0.5/260 = 0.00192 m/pixel
-        self.scale_y = abs(dy_gear / du_gear)    # 0.03/15 = 0.002 m/pixel
-        
-        # Depth calibration: Store reference depth for z-coordinate conversion
-        # At calibration points, z should be 0.8m (table height)
-        # We'll measure the actual depth sensor reading and use it as reference
-        self.z_table = 0.8  # World z-coordinate of table surface
-        self.depth_reference = None  # Will be set from first depth reading at calibration point
-        
-        self.get_logger().info(f'Pixel-to-world calibration: scale_x={self.scale_x:.6f} m/px, scale_y={self.scale_y:.6f} m/px')
-        self.get_logger().info(f'Origin: pixel({self.u_origin}, {self.v_origin}) -> world(0, 0, 0.8)')
-        self.get_logger().info(f'Coordinate mapping: u right=-y, v down=-x')
-        self.get_logger().info(f'Calibrated from green box at (320,240)->(0.5,0,0.8) and gear at (305,95)->(0.83,0.03,0.8)')
-        self.get_logger().info(f'Validation point: drill at (466,160)->(0.572,-0.241,0.832)')
-        self.get_logger().info(f'Validation point: monkey_wrench at (150,200)->(0.624,0.373,0.807)')
-        self.get_logger().info(f'Depth calibration: Call service at (320,240) to set depth reference for z=0.8m')
+        # ── iLogic Calibration ────────────────────────────────────────────────
+        # Linear model fitted from 22 empirical measurements (least-squares):
+        #   x =  0.00130317 * u  +0.00002114 * v  -0.56859693
+        #   y = -0.00002728 * u  -0.00133088 * v  +0.98011251
+        # LOO-CV RMSE ≈ 0.020 m
+        self.lin_cx = np.array([+0.00130317, +0.00002114, -0.56859693])  # [u, v, 1] → x
+        self.lin_cy = np.array([-0.00002728, -0.00133088, +0.98011251])  # [u, v, 1] → y
+
+        # Empirical correction table  (u, v, residual_x, residual_y)
+        # residual = true_world - linear_prediction  ← precomputed offline
+        # Used by the IDW Gaussian kernel to correct systematic lens distortion.
+        self._emp = np.array([
+            # u     v      res_x      res_y
+            [560,  362, -0.00383,  -0.02010],  # M1G_TR
+            [468,  452,  0.01316,   0.00117],  # M1G_BL
+            [334,  336, -0.00878,  -0.02882],  # M1P_TR
+            [241,  432,  0.00040,   0.00640],  # M1P_BL
+            [598,  245, -0.01089,  -0.01965],  # M2G_TR
+            [493,  342,  0.02291,   0.00854],  # M2G_BL
+            [304,  327, -0.01747,  -0.02659],  # M2P_TR
+            [206,  423, -0.00384,   0.00649],  # M2P_BL
+            [587,  113, -0.00378,  -0.00365],  # M3G_TR
+            [490,  202,  0.01584,   0.01714],  # M3G_BL
+            [273,  111, -0.00952,  -0.02493],  # M3P_TR
+            [177,  206,  0.00856,   0.00391],  # M3P_BL
+            [308,  302, -0.00316,   0.00224],  # M3X_TR
+            [276,  324,  0.00207,  -0.00836],  # M3X_BL
+            [555,  298, -0.01601,   0.00758],  # M4G_TR
+            [456,  384,  0.00623,   0.02542],  # M4G_BL
+            [343,  284, -0.02237,  -0.01282],  # M4P_TR
+            [247,  375, -0.00124,   0.01070],  # M4P_BL
+            [562,   85,  0.00041,   0.00834],  # M5G_TR
+            [468,  173,  0.02007,   0.03286],  # M5G_BL
+            [202,   98, -0.00669,  -0.00916],  # M5P_TR
+            [101,  196,  0.01778,   0.02352],  # M5P_BL
+        ], dtype=np.float64)
+        # Gaussian kernel bandwidth (pixels). Controls how far correction influence spreads.
+        self._idw_sigma = 80.0
+        # Threshold: if IDW weight-sum < this fraction of max possible, treat as Golden Zone.
+        self._golden_weight_threshold = 0.05
+
+        # Depth calibration
+        self.z_table = 0.8
+        self.depth_reference = None
+
+        self.get_logger().info('iLogic pixel-to-world: linear model + IDW empirical correction')
+        self.get_logger().info(f'  x = {self.lin_cx[0]:+.8f}*u {self.lin_cx[1]:+.8f}*v {self.lin_cx[2]:+.8f}')
+        self.get_logger().info(f'  y = {self.lin_cy[0]:+.8f}*u {self.lin_cy[1]:+.8f}*v {self.lin_cy[2]:+.8f}')
+        self.get_logger().info(f'  IDW sigma={self._idw_sigma}px  empirical samples={len(self._emp)}')
         self.get_logger().info(f'RGB topic: {self.rgb_topic}')
         self.get_logger().info(f'Depth topic: {self.depth_topic}')
         self.get_logger().info(f'Camera info topic: {self.camera_info_topic}')
@@ -213,11 +222,12 @@ def __init__(self,
 
         # Store calibration validation points for accuracy checking
         self.validation_points = [
-            {"name": "green_box", "pixel": (320, 240), "world": (0.5, 0.0, 0.8)},
-            {"name": "gear", "pixel": (305, 95), "world": (0.83, 0.03, 0.8)},
-            {"name": "drill", "pixel": (466, 160), "world": (0.571546, -0.240961, 0.831898)},
-            {"name": "monkey_wrench", "pixel": (150, 200), "world": (0.623673, 0.372909, 0.806652)},
-            {"name": "origin", "pixel": (320, 500), "world": (0.0, 0.0, 0.8)}
+            {"name": "M1G_TR",       "pixel": (560, 362), "world": ( 0.165,  0.463, 0.8)},
+            {"name": "M1P_TR",       "pixel": (334, 336), "world": (-0.135,  0.495, 0.8)},
+            {"name": "M3G_TR",       "pixel": (587, 113), "world": ( 0.195,  0.810, 0.8)},
+            {"name": "M3P_TR",       "pixel": (273, 111), "world": (-0.220,  0.800, 0.8)},
+            {"name": "M5G_TR",       "pixel": (562,  85), "world": ( 0.166,  0.860, 0.8)},
+            {"name": "M5P_TR",       "pixel": (202,  98), "world": (-0.310,  0.835, 0.8)},
         ]
 
         # TF
@@ -265,53 +275,85 @@ def depth_cb(self, msg: Image):
     def info_cb(self, msg: CameraInfo):
         self.camera_info = msg
 
+    def _idw_correction(self, u: float, v: float):
+        """iLogic: Gaussian-weighted mean of the empirical residuals at pixel (u, v).
+
+        Each row of self._emp gets weight exp(-0.5 * (pixel_distance / self._idw_sigma) ** 2).
+        The correction itself is a normalised average; it does not shrink with distance.
+
+        Returns (corr_x, corr_y, w_norm), w_norm = weight sum / sample count, in [0, 1].
+        """
+        eu = self._emp[:, 0]
+        ev = self._emp[:, 1]
+        err_x = self._emp[:, 2]
+        err_y = self._emp[:, 3]
+
+        dists = np.sqrt((eu - u) ** 2 + (ev - v) ** 2)
+        weights = np.exp(-0.5 * (dists / self._idw_sigma) ** 2)
+        w_sum = weights.sum()
+
+        # Normalise by the sample count, a loose upper bound on the weight sum
+        max_w_sum = len(self._emp) * 1.0  # upper bound: all weights=1
+        w_norm = w_sum / max_w_sum
+
+        if w_sum < 1e-12:  # every weight is negligible: avoid dividing by ~0
+            return 0.0, 0.0, 0.0
+
+        corr_x = float(np.dot(weights, err_x) / w_sum)
+        corr_y = float(np.dot(weights, err_y) / w_sum)
+        return corr_x, corr_y, w_norm
+
     def pixel_to_world_calibrated(self, u: int, v: int, depth_m: float):
-        """Convert pixel (u,v) to world coordinates (x,y,z) using calibration.
-        
-        Coordinate system:
-        - u increases right -> y DECREASES (u represents -y direction)
-        - v increases down -> x DECREASES (v represents -x direction)
-        - Origin at pixel (320, 500) = world (0, 0, 0.8)
-        - Depth is inversely related to z: small depth = high z (near camera, far from ground)
-        
+        """iLogic pixel → world conversion.
+
+        1. Apply the empirically fitted linear model (replaces the old 2-point
+           scale_x / scale_y formula which had large systematic errors).
+        2. Add a Gaussian-IDW empirical correction:
+             - Problem Zone (high weight from nearby samples): correction applied fully.
+             - Golden Zone  (low weight / far from all samples): correction fades to 0,
+               pure linear model used — avoids overfitting in unsampled areas.
+
         Args:
             u: pixel column (positive right)
             v: pixel row (positive down)
-            depth_m: depth in meters from camera (from depth sensor)
-            
+            depth_m: depth in meters from camera
+
         Returns:
             (x, y, z) in world coordinates (meters)
         """
-        # Calculate pixel offset from origin
-        du = u - self.u_origin  # positive = right in image
-        dv = v - self.v_origin  # positive = down in image
-        
-        # Apply transformation based on coordinate mapping:
-        # v down (-dv up) -> x increases: x = -dv * scale_x
-        # u right (-du left) -> y increases: y = -du * scale_y
-        x = -dv * self.scale_x  # Up in image -> positive x
-        y = -du * self.scale_y  # Left in image -> positive y
-        
-        # Apply y-offset for robot reference frame
-        # y = y - 0.5442  # Shift y by -0.5442 meters
-        
-        # Convert depth to z-coordinate
-        # Depth is inversely related to z: smaller depth = further from ground = higher z
-        # At table (z=0.8), we need to calibrate based on actual depth reading
-        # If depth_reference is set, use it; otherwise estimate from depth
+        # ── Step 1: Linear model (Golden Zone baseline) ───────────────────────
+        feat = np.array([u, v, 1.0])
+        x = float(np.dot(self.lin_cx, feat))
+        y = float(np.dot(self.lin_cy, feat))
+
+        # ── Step 2: iLogic empirical correction ───────────────────────────────
+        corr_x, corr_y, w_norm = self._idw_correction(float(u), float(v))
+
+        if w_norm >= self._golden_weight_threshold:
+            # Problem Zone: apply correction
+            x += corr_x
+            y += corr_y
+            zone = 'problem'
+        else:
+            # Golden Zone: trust linear model, skip correction
+            zone = 'golden'
+
+        self.get_logger().debug(
+            f'iLogic zone={zone} w_norm={w_norm:.3f} '  
+            f'corr=({corr_x:+.4f},{corr_y:+.4f}) '  
+            f'-> x={x:.4f} y={y:.4f}'
+        )
+
+        # ── Step 3: Depth → z ─────────────────────────────────────────────────
         if self.real_hardware:
-            z = depth_m  # Direct mapping for hardware
+            z = depth_m
         elif self.depth_reference is not None:
-            # z = z_table + (depth_reference - depth)
-            # When depth < depth_reference (closer to camera), z increases
-            # When depth > depth_reference (further from camera), z decreases
             z = self.z_table + (self.depth_reference - depth_m)
         else:
-            # First call: assume this is close to table depth, set reference
             self.depth_reference = depth_m
             self.get_logger().info(f'Set depth reference: {self.depth_reference:.3f}m at z={self.z_table}m')
             z = self.z_table
-        
+
         return (x, y, z)
 
     def read_depth_at(self, u: float, v: float, max_search: int = 5):
@@ -429,8 +471,8 @@ def handle_pixel_to_real(self, req, resp):
             cv2.putText(debug_img, label_depth, (u + 25, v + 5),
                        cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 255), 2)
             
-            # Draw origin marker at (320, 500)
-            origin_u, origin_v = self.u_origin, self.v_origin
+            # Draw frame-centre marker (approximate optical centre)
+            origin_u, origin_v = 320, 240
             if 0 <= origin_u < debug_img.shape[1] and 0 <= origin_v < debug_img.shape[0]:
                 cv2.drawMarker(debug_img, (origin_u, origin_v), (255, 255, 0), 
                              cv2.MARKER_TILTED_CROSS, 30, 2)

From a261190a3d653e379b112ebcb2b6795c8941d03a Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Thu, 9 Apr 2026 14:15:24 +0700
Subject: [PATCH 09/16] feat: ref from previous p2r

---
 vision/pixel_to_real.py | 665 +++++++++++++---------------------------
 1 file changed, 211 insertions(+), 454 deletions(-)

diff --git a/vision/pixel_to_real.py b/vision/pixel_to_real.py
index 43d678a..3347431 100644
--- a/vision/pixel_to_real.py
+++ b/vision/pixel_to_real.py
@@ -8,46 +8,30 @@
     int32 u     # pixel column (x-coordinate, positive to the right)
     int32 v     # pixel row (y-coordinate, positive downward)
   Response:
-    float64 x   # world X coordinate (m, positive to the right)
-    float64 y   # world Y coordinate (m, positive forward/away from camera) - with -0.722m offset applied
+    float64 x   # world X coordinate (m)
+    float64 y   # world Y coordinate (m, positive forward/away from camera)
     float64 z   # world Z coordinate (m, height above table/ground)
 
-Calibration Method (iLogic Hybrid):
-  Linear model fitted from 22 empirical measurements (least-squares, LOO-CV RMSE ≈ 2.0 cm):
-    x =  0.00130317·u + 0.00002114·v − 0.56859693
-    y = −0.00002728·u − 0.00133088·v + 0.98011251
-
-  A Gaussian-IDW empirical correction is added on top:
-    - Problem Zone (near any of the 22 samples): correction applied → RMSE ≈ 1.5 cm
-    - Golden Zone  (far from all samples):       pure linear model used → avoids overfitting
-
-  Empirical samples (u, v → world x, y):
-    (560,362)→(0.165,0.463)  (468,452)→(0.064,0.367)
-    (334,336)→(-0.135,0.495) (241,432)→(-0.245,0.405)
-    (598,245)→(0.205,0.618)  (493,342)→(0.104,0.520)
-    (304,327)→(-0.183,0.510) (206,423)→(-0.295,0.418)
-    (587,113)→(0.195,0.810)  (490,202)→(0.090,0.715)
-    (273,111)→(-0.220,0.800) (177,206)→(-0.325,0.705)
-    (308,302)→(-0.164,0.572) (276,324)→(-0.200,0.533)
-    (555,298)→(0.145,0.576)  (456,384)→(0.040,0.482)
-    (343,284)→(-0.138,0.580) (247,375)→(-0.240,0.485)
-    (562, 85)→(0.166,0.860)  (468,173)→(0.065,0.770)
-    (202, 98)→(-0.310,0.835) (101,196)→(-0.415,0.740)
-
-Setup:
-  1. Build the custom_interfaces package:
-     cd ~/final_project_ws
-     colcon build --packages-select custom_interfaces
-     source install/setup.bash
-  
-  2. Build the vision package:
-     colcon build --packages-select vision --symlink-install
-     source install/setup.bash
-  
-  3. Start the pixel_to_real service node:
-     ros2 run vision pixel_to_real_service
+Calibration Methods (Hybrid):
+  METHOD 1 – Intrinsic:
+    Pinhole back-projection using camera intrinsics + known camera pose (R, t).
+    t_base_cam is the tunable offset; R_base_cam captures camera orientation.
+
+  METHOD 2 – Empirical:
+    Least-squares fit on 22 calibration points (5 measures × 2 colours × TR/BL = 20, plus the M3X TR/BL pair),
+    2026-03-12, camera position [-0.0361, 0.5303, 0.6458], height 0.67 m:
+      x = -0.56859693 + 0.00130317*u + 0.00002114*v   (RMS 12.1 mm)
+      y =  0.98011251 - 0.00002728*u - 0.00133088*v   (RMS 16.9 mm)
+      2D RMSE = 20.8 mm
+
+  HYBRID:
+    Gaussian blend – empirical weighted higher near image centre (calibration
+    region), intrinsic weighted higher toward edges.
+
+Tuning:
+  • t_base_cam  – translate camera origin in base frame (x, y, z)
+  • Empirical coefficients – refit from new calibration measurements
 
-Usage:
   # Example: green box at pixel (320, 240) → world (0.5, 0.0, 0.8)
   ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 320, v: 240}"
   
@@ -66,27 +50,6 @@
   # View debug visualization:
   rqt_image_view /pixel_to_real/debug_image
 
-How it works:
-  Uses calibration points to compute a linear pixel-to-world transformation.
-  Reads depth from /camera/depth/image_raw to determine z-coordinate.
-  Shows debug visualization with pixel location and computed world coordinates.
-"""
-
-
-"""
-# linear approx. formula
-# Given pixel coordinates (u, v) and depth d from sensor:
-
-# Step 1: Calculate pixel offset from origin
-du = u - 320  # Origin u-coordinate
-dv = v - 500  # Origin v-coordinate
-
-# Step 2: Apply scaling and sign conversion
-x = -dv * 0.001923  # scale_x = 0.5/260 ≈ 0.001923 m/pixel
-y = -du * 0.002     # scale_y = 0.03/15 = 0.002 m/pixel
-
-# Step 3: Convert depth to z-coordinate
-z = 0.8 + (depth_reference - d)  # depth_reference set on first call
 
 
 """
@@ -94,446 +57,240 @@
 import rclpy
 from rclpy.node import Node
 from sensor_msgs.msg import Image, CameraInfo
-from geometry_msgs.msg import PointStamped
 from cv_bridge import CvBridge
 import numpy as np
 import math
-import tf2_ros
 import cv2
-import pyrealsense2 as rs
 
-# Replace with your actual service type. The repo often imports custom interfaces
-# from `custom_interfaces.srv`. Adjust the import if your package name differs.
+from image_geometry import PinholeCameraModel
+
 try:
     from custom_interfaces.srv import PixelToReal
 except Exception:
-    # The import may fail in editors; keep the name for when the package is built.
     PixelToReal = None
 
 
 class PixelToRealServer(Node):
-    def __init__(self,
-                 rgb_topic: str = '/camera/image_raw',
-                 depth_topic: str = '/camera/depth/image_raw',
-                 info_topic: str = '/camera/camera_info',
-                 default_target_frame: str = 'world'):
+
+    def __init__(self):
         super().__init__('pixel_to_real_server')
 
-        # Parameter toggles simulated vs hardware camera topics
-        self.declare_parameter('real_hardware', False)
+        self.declare_parameter('real_hardware', True)
         self.real_hardware = bool(self.get_parameter('real_hardware').value)
 
-        # RealSense-specific variables for hardware mode
-        self.rs_pipeline = None
-        self.rs_align = None
-        self.rs_intrinsics = None
-
         if self.real_hardware:
-            self.rgb_topic = '/camera/color/image_raw'
-            self.depth_topic = '/camera/depth/image_rect_raw'
-            self.camera_info_topic = 'camera/color/camera_info'
-            self.color_encoding = 'passthrough'
-            self.depth_32_encoding = 'passthrough'
-            self.depth_16_encoding = 'passthrough'
-            
-            # Note: We DO NOT initialize RealSense pipeline here!
-            # The camera is published by a separate node (e.g., realsense-ros)
-            # We only subscribe to the published topics
-            self.get_logger().info('Real hardware mode: subscribing to RealSense topics')
-            self.get_logger().info(f'  RGB: {self.rgb_topic}')
-            self.get_logger().info(f'  Depth: {self.depth_topic}')
-            self.get_logger().info(f'  Camera Info: {self.camera_info_topic}')
+            depth_topic      = '/camera/depth/image_rect_raw'
+            info_topic       = '/camera/color/camera_info'
+            rgb_topic        = '/camera/color/image_raw'
         else:
-            self.rgb_topic = rgb_topic or '/camera/image_raw'
-            self.depth_topic = depth_topic or '/camera/depth/image_raw'
-            self.camera_info_topic = info_topic or '/camera/camera_info'
-            self.color_encoding = 'bgr8'
-            self.depth_32_encoding = '32FC1'
-            self.depth_16_encoding = '16UC1'
-
-        self.bridge = CvBridge()
-        self.latest_rgb = None
-        self.latest_rgb_header = None
+            depth_topic      = '/camera/depth/image_raw'
+            info_topic       = '/camera/camera_info'
+            rgb_topic        = '/camera/image_raw'
+
+        self.bridge     = CvBridge()
+        self.cam_model  = PinholeCameraModel()
+
+        self.latest_rgb   = None
         self.latest_depth = None
-        self.latest_depth_header = None
-        self.camera_info = None
-        self.default_target_frame = default_target_frame
+        self.camera_ready = False
 
-        self.rgb_sub = self.create_subscription(Image, self.rgb_topic, self.rgb_cb, 10)
-        self.depth_sub = self.create_subscription(Image, self.depth_topic, self.depth_cb, 10)
-        self.info_sub = self.create_subscription(CameraInfo, self.camera_info_topic, self.info_cb, 10)
+        self.depth_sub = self.create_subscription(Image,      depth_topic, self.depth_cb, 10)
+        self.info_sub  = self.create_subscription(CameraInfo, info_topic,  self.info_cb,  10)
+        self.rgb_sub   = self.create_subscription(Image,      rgb_topic,   self.rgb_cb,   10)
 
-        # Publisher for debug visualization
         self.debug_pub = self.create_publisher(Image, '/pixel_to_real/debug_image', 10)
 
-        # ── iLogic Calibration ────────────────────────────────────────────────
-        # Linear model fitted from 22 empirical measurements (least-squares):
-        #   x =  0.00130317 * u  +0.00002114 * v  -0.56859693
-        #   y = -0.00002728 * u  -0.00133088 * v  +0.98011251
-        # LOO-CV RMSE ≈ 0.020 m
-        self.lin_cx = np.array([+0.00130317, +0.00002114, -0.56859693])  # [u, v, 1] → x
-        self.lin_cy = np.array([-0.00002728, -0.00133088, +0.98011251])  # [u, v, 1] → y
-
-        # Empirical correction table  (u, v, residual_x, residual_y)
-        # residual = true_world - linear_prediction  ← precomputed offline
-        # Used by the IDW Gaussian kernel to correct systematic lens distortion.
-        self._emp = np.array([
-            # u     v      res_x      res_y
-            [560,  362, -0.00383,  -0.02010],  # M1G_TR
-            [468,  452,  0.01316,   0.00117],  # M1G_BL
-            [334,  336, -0.00878,  -0.02882],  # M1P_TR
-            [241,  432,  0.00040,   0.00640],  # M1P_BL
-            [598,  245, -0.01089,  -0.01965],  # M2G_TR
-            [493,  342,  0.02291,   0.00854],  # M2G_BL
-            [304,  327, -0.01747,  -0.02659],  # M2P_TR
-            [206,  423, -0.00384,   0.00649],  # M2P_BL
-            [587,  113, -0.00378,  -0.00365],  # M3G_TR
-            [490,  202,  0.01584,   0.01714],  # M3G_BL
-            [273,  111, -0.00952,  -0.02493],  # M3P_TR
-            [177,  206,  0.00856,   0.00391],  # M3P_BL
-            [308,  302, -0.00316,   0.00224],  # M3X_TR
-            [276,  324,  0.00207,  -0.00836],  # M3X_BL
-            [555,  298, -0.01601,   0.00758],  # M4G_TR
-            [456,  384,  0.00623,   0.02542],  # M4G_BL
-            [343,  284, -0.02237,  -0.01282],  # M4P_TR
-            [247,  375, -0.00124,   0.01070],  # M4P_BL
-            [562,   85,  0.00041,   0.00834],  # M5G_TR
-            [468,  173,  0.02007,   0.03286],  # M5G_BL
-            [202,   98, -0.00669,  -0.00916],  # M5P_TR
-            [101,  196,  0.01778,   0.02352],  # M5P_BL
-        ], dtype=np.float64)
-        # Gaussian kernel bandwidth (pixels). Controls how far correction influence spreads.
-        self._idw_sigma = 80.0
-        # Threshold: if IDW weight-sum < this fraction of max possible, treat as Golden Zone.
-        self._golden_weight_threshold = 0.05
-
-        # Depth calibration
-        self.z_table = 0.8
-        self.depth_reference = None
-
-        self.get_logger().info('iLogic pixel-to-world: linear model + IDW empirical correction')
-        self.get_logger().info(f'  x = {self.lin_cx[0]:+.8f}*u {self.lin_cx[1]:+.8f}*v {self.lin_cx[2]:+.8f}')
-        self.get_logger().info(f'  y = {self.lin_cy[0]:+.8f}*u {self.lin_cy[1]:+.8f}*v {self.lin_cy[2]:+.8f}')
-        self.get_logger().info(f'  IDW sigma={self._idw_sigma}px  empirical samples={len(self._emp)}')
-        self.get_logger().info(f'RGB topic: {self.rgb_topic}')
-        self.get_logger().info(f'Depth topic: {self.depth_topic}')
-        self.get_logger().info(f'Camera info topic: {self.camera_info_topic}')
-        self.get_logger().info(f'real_hardware parameter: {self.real_hardware}')
-
-        # Store calibration validation points for accuracy checking
-        self.validation_points = [
-            {"name": "M1G_TR",       "pixel": (560, 362), "world": ( 0.165,  0.463, 0.8)},
-            {"name": "M1P_TR",       "pixel": (334, 336), "world": (-0.135,  0.495, 0.8)},
-            {"name": "M3G_TR",       "pixel": (587, 113), "world": ( 0.195,  0.810, 0.8)},
-            {"name": "M3P_TR",       "pixel": (273, 111), "world": (-0.220,  0.800, 0.8)},
-            {"name": "M5G_TR",       "pixel": (562,  85), "world": ( 0.166,  0.860, 0.8)},
-            {"name": "M5P_TR",       "pixel": (202,  98), "world": (-0.310,  0.835, 0.8)},
-        ]
-
-        # TF
-        self.tf_buffer = tf2_ros.Buffer()
-        self.tf_listener = tf2_ros.TransformListener(self.tf_buffer, self)
-
-        # Create service
+        # ── Depth scale (16UC1 → metres) ─────────────────────────────────────
+        self.depth_scale = 0.001   # mm → m
+
+        # ── METHOD 1: Camera pose in base_link ───────────────────────────────
+        # t_base_cam  : camera origin expressed in base frame  ← TUNE THIS
+        # R_base_cam  : rotation that maps camera axes to base axes
+        #               (camera Z forward → base -Z, camera Y down → base -Y)
+        self.t_base_cam = np.array([-0.146, 0.635, 0.8])   # <-- adjust here
+
+        self.R_base_cam = np.array([
+            [ 1.0,  0.0,  0.0],
+            [ 0.0, -1.0,  0.0],
+            [ 0.0,  0.0, -1.0],
+        ])
+
+        # ── METHOD 2: Empirical linear model ─────────────────────────────────
+        # Least-squares fit on 22 calibration points (5 measures × 2 colours
+        # × TR/BL), 2026-03-12.  Model:  x = a0 + a1*u + a2*v
+        #                                y = b0 + b1*u + b2*v
+        # 2D RMSE = 20.8 mm  (x: 12.1 mm, y: 16.9 mm)
+        self._emp_ax = np.array([-0.56859693, +0.00130317, +0.00002114])  # [1,u,v]→x
+        self._emp_ay = np.array([+0.98011251, -0.00002728, -0.00133088])  # [1,u,v]→y
+        self._emp_z  = -0.002   # table height assumption (m)
+
+        # ── Hybrid blend parameters ───────────────────────────────────────────
+        # Empirical is most accurate near image centre (calibration region).
+        # Gaussian decay controls how quickly we trust intrinsics at the edges.
+        self._image_center    = (320, 240)   # (u_c, v_c)
+        self._blend_sigma_frac = 0.6         # fraction of max diagonal for σ
+
         if PixelToReal is not None:
-            self.srv = self.create_service(PixelToReal, 'pixel_to_real', self.handle_pixel_to_real)
-            self.get_logger().info('Service /pixel_to_real ready (custom_interfaces.srv.PixelToReal)')
-            self.get_logger().info('Usage: ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 320, v: 240}"')
+            self.srv = self.create_service(
+                PixelToReal, '/pixel_to_real', self.handle_pixel_to_real
+            )
+            self.get_logger().info('Service /pixel_to_real ready')
         else:
-            self.get_logger().error('PixelToReal srv type not found!')
-            self.get_logger().error('Build custom_interfaces: colcon build --packages-select custom_interfaces')
+            self.get_logger().error(
+                'PixelToReal srv not found – build custom_interfaces first.'
+            )
             raise RuntimeError('custom_interfaces.srv.PixelToReal not available')
 
+        self.get_logger().info(
+            f't_base_cam = {self.t_base_cam.tolist()}   '
+            f'real_hardware={self.real_hardware}'
+        )
+
+    # ── Callbacks ─────────────────────────────────────────────────────────────
+
     def rgb_cb(self, msg: Image):
-        """Store the latest RGB image for pixel coordinate validation."""
         try:
-            rgb_img = self.bridge.imgmsg_to_cv2(msg, desired_encoding=self.color_encoding)
-            self.latest_rgb = rgb_img
-            self.latest_rgb_header = msg.header
+            self.latest_rgb = self.bridge.imgmsg_to_cv2(msg, 'bgr8')
         except Exception as e:
-            self.get_logger().error(f"Failed to convert RGB image: {e}")
+            self.get_logger().error(f'RGB convert error: {e}')
 
     def depth_cb(self, msg: Image):
-        # Support 32FC1 and 16UC1 encodings; convert to float32 meters.
         try:
-            if msg.encoding == '32FC1' or msg.encoding == '32F':
-                depth_img = self.bridge.imgmsg_to_cv2(msg, desired_encoding=self.depth_32_encoding)
-                depth = depth_img.astype(np.float32)
-            elif msg.encoding == '16UC1' or msg.encoding == '16U':
-                d16 = self.bridge.imgmsg_to_cv2(msg, desired_encoding=self.depth_16_encoding)
-                depth = d16.astype(np.float32) / 1000.0  # assume mm -> m
+            if msg.encoding in ('16UC1', '16U'):
+                raw = self.bridge.imgmsg_to_cv2(msg, 'passthrough')
+                self.latest_depth = raw.astype(np.float32) * self.depth_scale
+            elif msg.encoding in ('32FC1', '32F'):
+                self.latest_depth = self.bridge.imgmsg_to_cv2(
+                    msg, 'passthrough'
+                ).astype(np.float32)
             else:
-                # Try a generic conversion to float32
-                depth_img = self.bridge.imgmsg_to_cv2(msg, desired_encoding='passthrough')
-                depth = depth_img.astype(np.float32)
-
-            self.latest_depth = depth
-            self.latest_depth_header = msg.header
+                raw = self.bridge.imgmsg_to_cv2(msg, 'passthrough')
+                self.latest_depth = raw.astype(np.float32)
         except Exception as e:
-            self.get_logger().error(f"Failed to convert depth image: {e}")
+            self.get_logger().error(f'Depth convert error: {e}')
 
     def info_cb(self, msg: CameraInfo):
-        self.camera_info = msg
-
-    def _idw_correction(self, u: float, v: float):
-        """iLogic: compute Gaussian-IDW empirical correction at pixel (u, v).
+        self.cam_model.fromCameraInfo(msg)
+        self.camera_ready = True
 
-        Golden Zone  (low influence from empirical samples) → correction ≈ 0.
-        Problem Zone (high influence near known distortion samples) → correction applied.
+    # ── Depth reading ──────────────────────────────────────────────────────────
 
-        Returns (corr_x, corr_y, weight_sum_norm) where weight_sum_norm in [0, 1].
-        """
-        eu = self._emp[:, 0]
-        ev = self._emp[:, 1]
-        err_x = self._emp[:, 2]
-        err_y = self._emp[:, 3]
-
-        dists = np.sqrt((eu - u) ** 2 + (ev - v) ** 2)
-        weights = np.exp(-0.5 * (dists / self._idw_sigma) ** 2)
-        w_sum = weights.sum()
-
-        # Maximum possible weight_sum (if u,v were exactly on a sample point)
-        max_w_sum = len(self._emp) * 1.0  # upper bound: all weights=1
-        w_norm = w_sum / max_w_sum
-
-        if w_sum < 1e-12:
-            return 0.0, 0.0, 0.0
-
-        corr_x = float(np.dot(weights, err_x) / w_sum)
-        corr_y = float(np.dot(weights, err_y) / w_sum)
-        return corr_x, corr_y, w_norm
-
-    def pixel_to_world_calibrated(self, u: int, v: int, depth_m: float):
-        """iLogic pixel → world conversion.
-
-        1. Apply the empirically fitted linear model (replaces the old 2-point
-           scale_x / scale_y formula which had large systematic errors).
-        2. Add a Gaussian-IDW empirical correction:
-             - Problem Zone (high weight from nearby samples): correction applied fully.
-             - Golden Zone  (low weight / far from all samples): correction fades to 0,
-               pure linear model used — avoids overfitting in unsampled areas.
-
-        Args:
-            u: pixel column (positive right)
-            v: pixel row (positive down)
-            depth_m: depth in meters from camera
-
-        Returns:
-            (x, y, z) in world coordinates (meters)
+    def get_robust_depth(self, u: int, v: int, window: int = 5) -> float | None:
+        """Median depth over a small window; returns None if no valid pixels."""
+        if self.latest_depth is None:
+            return None
+        h, w = self.latest_depth.shape
+        half = window // 2
+        u0, u1 = max(u - half, 0), min(u + half + 1, w)
+        v0, v1 = max(v - half, 0), min(v + half + 1, h)
+        patch = self.latest_depth[v0:v1, u0:u1]
+        valid = patch[np.isfinite(patch) & (patch > 0.0)]
+        return float(np.median(valid)) if len(valid) > 0 else None
+
+    # ── Conversion methods ─────────────────────────────────────────────────────
+
+    def _intrinsic_estimate(self, u: int, v: int, Z: float) -> np.ndarray:
+        """METHOD 1: pinhole back-projection + rigid-body transform to base.
+
+        ray = cam_model.projectPixelTo3dRay((u, v))  [unit vector in cam frame]
+        p_cam = ray * Z                               [scale to depth]
+        p_base = R @ p_cam + t                        [transform to base frame]
         """
-        # ── Step 1: Linear model (Golden Zone baseline) ───────────────────────
-        feat = np.array([u, v, 1.0])
-        x = float(np.dot(self.lin_cx, feat))
-        y = float(np.dot(self.lin_cy, feat))
-
-        # ── Step 2: iLogic empirical correction ───────────────────────────────
-        corr_x, corr_y, w_norm = self._idw_correction(float(u), float(v))
-
-        if w_norm >= self._golden_weight_threshold:
-            # Problem Zone: apply correction
-            x += corr_x
-            y += corr_y
-            zone = 'problem'
+        if not self.camera_ready:
+            # Fallback: hardcoded D435i intrinsics
+            fx, fy, cx, cy = 615.0, 615.0, 320.0, 240.0
+            ray = np.array([(u - cx) / fx, (v - cy) / fy, 1.0])
         else:
-            # Golden Zone: trust linear model, skip correction
-            zone = 'golden'
+            ray = np.array(self.cam_model.projectPixelTo3dRay((u, v)))
+
+        p_cam  = ray * Z
+        p_base = self.R_base_cam @ p_cam + self.t_base_cam
+        return p_base
+
+    def _empirical_estimate(self, u: int, v: int) -> np.ndarray:
+        """METHOD 2: simple linear model fitted from calibration data."""
+        feat = np.array([1.0, float(u), float(v)])
+        x = float(np.dot(self._emp_ax, feat))
+        y = float(np.dot(self._emp_ay, feat))
+        return np.array([x, y, self._emp_z])
+
+    def _hybrid_estimate(
+        self,
+        u: int, v: int,
+        p_intrinsic: np.ndarray,
+        p_empirical: np.ndarray,
+    ) -> tuple[np.ndarray, float, float]:
+        """HYBRID: Gaussian-weighted blend.
+
+        Empirical weight is highest at the image centre (calibration region)
+        and decays towards the edges; intrinsic picks up the slack.
+        """
+        uc, vc = self._image_center
+        dist   = math.sqrt((u - uc) ** 2 + (v - vc) ** 2)
+        sigma  = math.sqrt(uc ** 2 + vc ** 2) * self._blend_sigma_frac  # ~σ in pixels
+
+        w_emp  = math.exp(-dist / sigma)
+        w_int  = 1.0 - w_emp
+
+        p_hybrid = w_emp * p_empirical + w_int * p_intrinsic
+        return p_hybrid, w_emp, w_int
+
+    # ── Service handler ────────────────────────────────────────────────────────
+
+    def handle_pixel_to_real(self, request, response):
+        u = int(request.u)
+        v = int(request.v)
+
+        # ── Depth ─────────────────────────────────────────────────────────────
+        Z = self.get_robust_depth(u, v)
+        if Z is None:
+            self.get_logger().warn(f'No valid depth at ({u},{v}), using 0.8 m fallback.')
+            Z = 0.8   # fallback to estimated table depth
 
-        self.get_logger().debug(
-            f'iLogic zone={zone} w_norm={w_norm:.3f} '  
-            f'corr=({corr_x:+.4f},{corr_y:+.4f}) '  
-            f'-> x={x:.4f} y={y:.4f}'
+        # ── Compute both estimates ────────────────────────────────────────────
+        p_int = self._intrinsic_estimate(u, v, Z)
+        p_emp = self._empirical_estimate(u, v)
+
+        # ── Blend ─────────────────────────────────────────────────────────────
+        p_hybrid, w_emp, w_int = self._hybrid_estimate(u, v, p_int, p_emp)
+
+        response.x = float(p_hybrid[0])
+        response.y = float(p_hybrid[1])
+        response.z = float(p_hybrid[2])
+
+        self.get_logger().info(
+            f'Pixel ({u},{v}) depth={Z:.3f}m | '
+            f'Intrinsic=[{p_int[0]:.4f},{p_int[1]:.4f},{p_int[2]:.4f}] '
+            f'Empirical=[{p_emp[0]:.4f},{p_emp[1]:.4f}] '
+            f'Hybrid=[{p_hybrid[0]:.4f},{p_hybrid[1]:.4f},{p_hybrid[2]:.4f}] '
+            f'(w_emp={w_emp:.3f} w_int={w_int:.3f})'
         )
 
-        # ── Step 3: Depth → z ─────────────────────────────────────────────────
-        if self.real_hardware:
-            z = depth_m
-        elif self.depth_reference is not None:
-            z = self.z_table + (self.depth_reference - depth_m)
-        else:
-            self.depth_reference = depth_m
-            self.get_logger().info(f'Set depth reference: {self.depth_reference:.3f}m at z={self.z_table}m')
-            z = self.z_table
-
-        return (x, y, z)
-
-    def read_depth_at(self, u: float, v: float, max_search: int = 5):
-        """Read depth with bilinear interpolation; if invalid, search a median window.
-        Returns depth in meters. Assumes table is at 0.8m depth.
-        
-        Handles invalid depth (NaN/zero/inf) common on reflective surfaces or sensor noise
-        by searching a 5-pixel neighborhood and taking the median of valid depth values.
-        
-        The depth sensor returns distance from camera. We assume the table surface
-        is at 0.8m from the camera, which should be the largest/most common depth value.
-        """
-        if self.latest_depth is None:
-            self.get_logger().warn('No depth image available, using default table depth 0.8m')
-            return 0.8  # Default table depth
-        
-        depth = self.latest_depth
-        h, w = depth.shape[:2]
-        if not (0 <= int(v) < h and 0 <= int(u) < w):
-            return 0.8  # Default if out of bounds
-
-        def bilinear(u_, v_):
-            x0 = int(math.floor(u_)); x1 = min(x0 + 1, w - 1)
-            y0 = int(math.floor(v_)); y1 = min(y0 + 1, h - 1)
-            wa = (x1 - u_) * (y1 - v_)
-            wb = (u_ - x0) * (y1 - v_)
-            wc = (x1 - u_) * (v_ - y0)
-            wd = (u_ - x0) * (v_ - y0)
-            d00 = float(depth[y0, x0]); d10 = float(depth[y0, x1])
-            d01 = float(depth[y1, x0]); d11 = float(depth[y1, x1])
-            d = wa * d00 + wb * d10 + wc * d01 + wd * d11
-            if np.isnan(d) or d <= 0.0 or np.isinf(d):
-                return None
-            return float(d)
-
-
-        #ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 220, v: 220}"
-        # Use topic-based depth reading for both hardware and simulation
-        if self.latest_depth is not None:
-            d = self.latest_depth[int(v), int(u)]
-            self.get_logger().info(f'Read depth at ({u},{v}): {d:.3f}m from topic')
-        else:
-                    self.get_logger().warn('No depth data available, using default 0.8m')
-                    return 0.8
-
-
-
-
-
-
-
-
-        # Fallback: collect valid depths in neighborhood and take median
-        valid_depths = []
-        for du in range(-max_search, max_search + 1):
-            for dv in range(-max_search, max_search + 1):
-                uu = u + du
-                vv = v + dv
-                if 0 <= int(uu) < w and 0 <= int(vv) < h:
-                    d_val = bilinear(uu, vv)
-                    if d_val is not None:
-                        valid_depths.append(d_val)
-        
-        if len(valid_depths) == 0:
-            self.get_logger().warn(f'No valid depth found within {max_search}px of ({u:.1f},{v:.1f}), using table depth 0.8m')
-            return 0.8  # Default table depth
-        
-        # Use median to be robust against outliers
-        median_depth = float(np.median(valid_depths))
-        return median_depth
-
-    def backproject(self, u: float, v: float, d: float):
-        # Use camera_info intrinsics
-        K = self.camera_info.k
-        fx = K[0]; fy = K[4]; cx = K[2]; cy = K[5]
-        x_c = (u - cx) * d / fx
-        y_c = (v - cy) * d / fy
-        z_c = d
-        return np.array([x_c, y_c, z_c], dtype=np.float64)
-
-    def handle_pixel_to_real(self, req, resp):
-        """Handle pixel to real coordinate conversion service request."""
-        # Get pixel coordinates from request (int32 fields)
-        u = int(req.u)
-        v = int(req.v)
-
-        # Get depth at this pixel (default to table depth 0.8m)
-        depth_m = self.read_depth_at(float(u), float(v))
-        
-        # Convert pixel to world coordinates using calibration
-        x_w, y_w, z_w = self.pixel_to_world_calibrated(u, v, depth_m)
-        
-        # DEBUG: Visualize the pixel location and world coordinates on the image
-        if self.latest_rgb is not None:
-            debug_img = self.latest_rgb.copy()
-            
-            # Draw a large crosshair at the requested pixel
-            cv2.drawMarker(debug_img, (u, v), (0, 0, 255), cv2.MARKER_CROSS, 40, 3)
-            
-            # Draw a circle around it
-            cv2.circle(debug_img, (u, v), 20, (0, 255, 0), 2)
-            
-            # Add text label with pixel coordinates
-            label_pixel = f"Pixel: ({u}, {v})"
-            cv2.putText(debug_img, label_pixel, (u + 25, v - 45),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 255), 2)
-            
-            # Add text label with world coordinates
-            label_world = f"World: ({x_w:.3f}, {y_w:.3f}, {z_w:.3f})m"
-            cv2.putText(debug_img, label_world, (u + 25, v - 20),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, (255, 0, 255), 2)
-            
-            # Add depth label
-            label_depth = f"Depth: {depth_m:.3f}m"
-            cv2.putText(debug_img, label_depth, (u + 25, v + 5),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 255), 2)
-            
-            # Draw frame-centre marker (approximate optical centre)
-            origin_u, origin_v = 320, 240
-            if 0 <= origin_u < debug_img.shape[1] and 0 <= origin_v < debug_img.shape[0]:
-                cv2.drawMarker(debug_img, (origin_u, origin_v), (255, 255, 0), 
-                             cv2.MARKER_TILTED_CROSS, 30, 2)
-                cv2.putText(debug_img, "Origin (0,0)", (origin_u + 10, origin_v - 10),
-                           cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 0), 2)
-            
-            # Draw coordinate axes for reference
-            cv2.putText(debug_img, "u -> (right)", (10, 30),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 0, 0), 2)
-            cv2.putText(debug_img, "v", (10, 55),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
-            cv2.putText(debug_img, "|", (10, 68),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
-            cv2.putText(debug_img, "v (down)", (10, 85),
-                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
-            
-            # Publish debug image
-            try:
-                debug_msg = self.bridge.cv2_to_imgmsg(debug_img, encoding='bgr8')
-                debug_msg.header.stamp = self.get_clock().now().to_msg()
-                debug_msg.header.frame_id = 'camera_link'
-                self.debug_pub.publish(debug_msg)
-                self.get_logger().info(f'Published debug image for pixel ({u}, {v})')
-            except Exception as e:
-                self.get_logger().error(f'Failed to publish debug image: {e}')
-
-        # Validate pixel coordinates against RGB image dimensions
-        if self.latest_rgb is not None:
-            rgb_h, rgb_w = self.latest_rgb.shape[:2]
-            if not (0 <= u < rgb_w and 0 <= v < rgb_h):
-                self.get_logger().error(f'Pixel ({u},{v}) out of RGB image bounds ({rgb_w}x{rgb_h})')
-                # Return zero coordinates for out of bounds
-                resp.x = 0.0
-                resp.y = 0.0
-                resp.z = 0.0
-                return resp
-
-        # Fill response (float64 fields)
-        resp.x = float(x_w)
-        resp.y = float(y_w)
-        resp.z = float(z_w)
-        
-        # Check if this is a known calibration point and log the error
-        for calib_point in self.validation_points:
-            if abs(u - calib_point["pixel"][0]) <= 1 and abs(v - calib_point["pixel"][1]) <= 1:
-                expected = calib_point["world"]
-                error_x = x_w - expected[0]
-                error_y = y_w - expected[1]
-                error_z = z_w - expected[2]
-                error_dist = np.sqrt(error_x**2 + error_y**2 + error_z**2)
-                
-                self.get_logger().info(
-                    f'Validation point "{calib_point["name"]}" at pixel ({u},{v}): '
-                    f'Calculated ({x_w:.3f}, {y_w:.3f}, {z_w:.3f}), '
-                    f'Expected ({expected[0]:.3f}, {expected[1]:.3f}, {expected[2]:.3f}), '
-                    f'Error: dx={error_x:.3f}m, dy={error_y:.3f}m, dz={error_z:.3f}m, dist={error_dist:.3f}m'
-                )
-                break
-        
-        self.get_logger().info(f'Pixel ({u},{v}) -> World ({x_w:.3f}m, {y_w:.3f}m, {z_w:.3f}m)')
-        return resp
+        # ── Debug image ───────────────────────────────────────────────────────
+        self._publish_debug(u, v, p_hybrid, Z)
+
+        return response
+
+    def _publish_debug(self, u: int, v: int, p: np.ndarray, depth: float):
+        if self.latest_rgb is None:
+            return
+        img = self.latest_rgb.copy()
+        cv2.drawMarker(img, (u, v), (0, 0, 255), cv2.MARKER_CROSS, 40, 3)
+        cv2.circle(img, (u, v), 20, (0, 255, 0), 2)
+        cv2.putText(img, f'Pixel: ({u},{v})',
+                    (u + 25, v - 45), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 255), 2)
+        cv2.putText(img, f'World: ({p[0]:.3f},{p[1]:.3f},{p[2]:.3f})m',
+                    (u + 25, v - 20), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (255, 0, 255), 2)
+        cv2.putText(img, f'Depth: {depth:.3f}m',
+                    (u + 25, v + 5), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 255), 2)
+        uc, vc = self._image_center
+        cv2.drawMarker(img, (uc, vc), (255, 255, 0), cv2.MARKER_TILTED_CROSS, 30, 2)
+        try:
+            msg = self.bridge.cv2_to_imgmsg(img, encoding='bgr8')
+            msg.header.stamp = self.get_clock().now().to_msg()
+            self.debug_pub.publish(msg)
+        except Exception as e:
+            self.get_logger().error(f'Debug publish error: {e}')
 
 
 def main(args=None):

From 4d479260bc6f4386c83e8c267c2226d00a5529b2 Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Fri, 10 Apr 2026 01:58:56 +0700
Subject: [PATCH 10/16] fix: change empirical equation to pixel to real world

---
 vision/pixel_to_real.py       | 639 ++++++++++++++++++++++------------
 vision/pixel_to_real_world.py |  90 ++++-
 2 files changed, 497 insertions(+), 232 deletions(-)

diff --git a/vision/pixel_to_real.py b/vision/pixel_to_real.py
index 3347431..dc5d75a 100644
--- a/vision/pixel_to_real.py
+++ b/vision/pixel_to_real.py
@@ -8,48 +8,76 @@
     int32 u     # pixel column (x-coordinate, positive to the right)
     int32 v     # pixel row (y-coordinate, positive downward)
   Response:
-    float64 x   # world X coordinate (m)
-    float64 y   # world Y coordinate (m, positive forward/away from camera)
+    float64 x   # world X coordinate (m, increases toward the top of the image)
+    float64 y   # world Y coordinate (m, increases toward the left of the image; no offset applied)
     float64 z   # world Z coordinate (m, height above table/ground)
 
-Calibration Methods (Hybrid):
-  METHOD 1 – Intrinsic:
-    Pinhole back-projection using camera intrinsics + known camera pose (R, t).
-    t_base_cam is the tunable offset; R_base_cam captures camera orientation.
-
-  METHOD 2 – Empirical:
-    Least-squares fit on 22 calibration points (5 measures × 2 colours × TR/BL),
-    2026-03-12, camera position [-0.0361, 0.5303, 0.6458], height 0.67 m:
-      x = -0.56859693 + 0.00130317*u + 0.00002114*v   (RMS 12.1 mm)
-      y =  0.98011251 - 0.00002728*u - 0.00133088*v   (RMS 16.9 mm)
-      2D RMSE = 20.8 mm
-
-  HYBRID:
-    Gaussian blend – empirical weighted higher near image centre (calibration
-    region), intrinsic weighted higher toward edges.
-
-Tuning:
-  • t_base_cam  – translate camera origin in base frame (x, y, z)
-  • Empirical coefficients – refit from new calibration measurements
-
+Calibration Data:
+  - Origin (0, 0, 0.8) in world: pixel (320, 500) - bottom center of image
+  - Green box at world (0.5, 0, 0.8): pixel (320, 240)
+  - Gear part at world (0.83, 0.03, 0.8): pixel (305, 95)
+  - Drill at world (0.571546, -0.240961, 0.831898): pixel (466, 160.5)
+  - Monkey wrench at world (0.623673, 0.372909, 0.806652): pixel (150, 200)
+  - Table depth: 0.8 m from camera
+  - Coordinate mapping:
+    * u increases right → y DECREASES (u represents -y direction)
+    * v increases down → x DECREASES (v represents -x direction)
+    * x in world increases upward in image (opposite of v)
+    * y in world increases leftward in image (opposite of u)
+
+Setup:
+  1. Build the custom_interfaces package:
+     cd ~/final_project_ws
+     colcon build --packages-select custom_interfaces
+     source install/setup.bash
+
+  2. Build the vision package:
+     colcon build --packages-select vision --symlink-install
+     source install/setup.bash
+
+  3. Start the pixel_to_real service node:
+     ros2 run vision pixel_to_real_service
+
+Usage:
   # Example: green box at pixel (320, 240) → world (0.5, 0.0, 0.8)
   ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 320, v: 240}"
-  
+
   # Example: gear part at pixel (305, 95) → world (0.83, 0.03, 0.8)
   ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 305, v: 95}"
-  
+
   # Example: drill at pixel (466, 160.5) → world (0.571546, -0.240961, 0.831898)
   ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 466, v: 160}"
-  
+
   # Example: monkey wrench at pixel (150, 200) → world (0.623673, 0.372909, 0.806652)
   ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 150, v: 200}"
-  
+
   # Example: origin at pixel (320, 500) → world (0.0, 0.0, 0.8)
   ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 320, v: 500}"
-  
+
   # View debug visualization:
   rqt_image_view /pixel_to_real/debug_image
 
+How it works:
+  Uses calibration points to compute a linear pixel-to-world transformation.
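+  Reads depth from the depth image topic (/camera/depth/image_raw in simulation, /camera/depth/image_rect_raw on real hardware) to determine the z-coordinate.
+  Publishes a debug visualization with the pixel location and computed world coordinates on /pixel_to_real/debug_image.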
+"""
+
+
+"""
+# Linear approximation formula (pseudo-code for reference only; this string is never executed)
+# Given pixel coordinates (u, v) and depth d from sensor:
+
+# Step 1: Calculate pixel offset from origin
+du = u - 320  # Origin u-coordinate
+dv = v - 500  # Origin v-coordinate
+
+# Step 2: Apply scaling and sign conversion
+x = -dv * 0.001923  # scale_x = 0.5/260 ≈ 0.001923 m/pixel
+y = -du * 0.002     # scale_y = 0.03/15 = 0.002 m/pixel
+
+# Step 3: Convert depth to z-coordinate (simulation mode; on real hardware z is the raw depth d)
+z = 0.8 + (depth_reference - d)  # depth_reference set on first call
 
 
 """
@@ -57,240 +85,413 @@
 import rclpy
 from rclpy.node import Node
 from sensor_msgs.msg import Image, CameraInfo
+from geometry_msgs.msg import PointStamped
 from cv_bridge import CvBridge
 import numpy as np
 import math
+import tf2_ros
 import cv2
+import pyrealsense2 as rs
 
-from image_geometry import PinholeCameraModel
-
+# Replace with your actual service type. The repo often imports custom interfaces
+# from `custom_interfaces.srv`. Adjust the import if your package name differs.
 try:
     from custom_interfaces.srv import PixelToReal
 except Exception:
+    # The import may fail in editors; keep the name for when the package is built.
     PixelToReal = None
 
 
 class PixelToRealServer(Node):
-
-    def __init__(self):
+    def __init__(self,
+                 rgb_topic: str = '/camera/image_raw',
+                 depth_topic: str = '/camera/depth/image_raw',
+                 info_topic: str = '/camera/camera_info',
+                 default_target_frame: str = 'world'):
         super().__init__('pixel_to_real_server')
 
-        self.declare_parameter('real_hardware', True)
+        # Parameter toggles simulated vs hardware camera topics
+        self.declare_parameter('real_hardware', False)
         self.real_hardware = bool(self.get_parameter('real_hardware').value)
 
+        # RealSense-specific variables for hardware mode
+        self.rs_pipeline = None
+        self.rs_align = None
+        self.rs_intrinsics = None
+
         if self.real_hardware:
-            depth_topic      = '/camera/depth/image_rect_raw'
-            info_topic       = '/camera/color/camera_info'
-            rgb_topic        = '/camera/color/image_raw'
+            self.rgb_topic = '/camera/color/image_raw'
+            self.depth_topic = '/camera/depth/image_rect_raw'
+            self.camera_info_topic = 'camera/color/camera_info'
+            self.color_encoding = 'passthrough'
+            self.depth_32_encoding = 'passthrough'
+            self.depth_16_encoding = 'passthrough'
+
+            # Note: We DO NOT initialize RealSense pipeline here!
+            # The camera is published by a separate node (e.g., realsense-ros)
+            # We only subscribe to the published topics
+            self.get_logger().info('Real hardware mode: subscribing to RealSense topics')
+            self.get_logger().info(f'  RGB: {self.rgb_topic}')
+            self.get_logger().info(f'  Depth: {self.depth_topic}')
+            self.get_logger().info(f'  Camera Info: {self.camera_info_topic}')
         else:
-            depth_topic      = '/camera/depth/image_raw'
-            info_topic       = '/camera/camera_info'
-            rgb_topic        = '/camera/image_raw'
-
-        self.bridge     = CvBridge()
-        self.cam_model  = PinholeCameraModel()
-
-        self.latest_rgb   = None
+            self.rgb_topic = rgb_topic or '/camera/image_raw'
+            self.depth_topic = depth_topic or '/camera/depth/image_raw'
+            self.camera_info_topic = info_topic or '/camera/camera_info'
+            self.color_encoding = 'bgr8'
+            self.depth_32_encoding = '32FC1'
+            self.depth_16_encoding = '16UC1'
+
+        self.bridge = CvBridge()
+        self.latest_rgb = None
+        self.latest_rgb_header = None
         self.latest_depth = None
-        self.camera_ready = False
+        self.latest_depth_header = None
+        self.camera_info = None
+        self.default_target_frame = default_target_frame
 
-        self.depth_sub = self.create_subscription(Image,      depth_topic, self.depth_cb, 10)
-        self.info_sub  = self.create_subscription(CameraInfo, info_topic,  self.info_cb,  10)
-        self.rgb_sub   = self.create_subscription(Image,      rgb_topic,   self.rgb_cb,   10)
+        self.rgb_sub = self.create_subscription(Image, self.rgb_topic, self.rgb_cb, 10)
+        self.depth_sub = self.create_subscription(Image, self.depth_topic, self.depth_cb, 10)
+        self.info_sub = self.create_subscription(CameraInfo, self.camera_info_topic, self.info_cb, 10)
 
+        # Publisher for debug visualization
         self.debug_pub = self.create_publisher(Image, '/pixel_to_real/debug_image', 10)
 
-        # ── Depth scale (16UC1 → metres) ─────────────────────────────────────
-        self.depth_scale = 0.001   # mm → m
-
-        # ── METHOD 1: Camera pose in base_link ───────────────────────────────
-        # t_base_cam  : camera origin expressed in base frame  ← TUNE THIS
-        # R_base_cam  : rotation that maps camera axes to base axes
-        #               (camera Z forward → base -Z, camera Y down → base -Y)
-        self.t_base_cam = np.array([-0.146, 0.635, 0.8])   # <-- adjust here
-
-        self.R_base_cam = np.array([
-            [ 1.0,  0.0,  0.0],
-            [ 0.0, -1.0,  0.0],
-            [ 0.0,  0.0, -1.0],
-        ])
-
-        # ── METHOD 2: Empirical linear model ─────────────────────────────────
-        # Least-squares fit on 22 calibration points (5 measures × 2 colours
-        # × TR/BL), 2026-03-12.  Model:  x = a0 + a1*u + a2*v
-        #                                y = b0 + b1*u + b2*v
-        # 2D RMSE = 20.8 mm  (x: 12.1 mm, y: 16.9 mm)
-        self._emp_ax = np.array([-0.56859693, +0.00130317, +0.00002114])  # [1,u,v]→x
-        self._emp_ay = np.array([+0.98011251, -0.00002728, -0.00133088])  # [1,u,v]→y
-        self._emp_z  = -0.002   # table height assumption (m)
-
-        # ── Hybrid blend parameters ───────────────────────────────────────────
-        # Empirical is most accurate near image centre (calibration region).
-        # Gaussian decay controls how quickly we trust intrinsics at the edges.
-        self._image_center    = (320, 240)   # (u_c, v_c)
-        self._blend_sigma_frac = 0.6         # fraction of max diagonal for σ
-
+        # Calibration data: pixel coordinates (u, v) -> world coordinates (x, y, z)
+        # Using calibration points:
+        # Origin: (u=320, v=500) -> (x=0, y=0, z=0.8)
+        # Green box: (u=320, v=240) -> (x=0.5, y=0, z=0.8)
+        # Gear: (u=305, v=95) -> (x=0.83, y=0.03, z=0.8)
+
+        # Coordinate system mapping:
+        # u increases right -> y DECREASES (u represents -y direction)
+        # v increases down -> x DECREASES (v represents -x direction)
+
+        self.u_origin = 320  # u=320 corresponds to y=0
+        self.v_origin = 500  # v=500 corresponds to x=0
+
+        # Calculate scaling factors from calibration points:
+        # Green box: du=0, dv=-260 pixels -> dx=0.5, dy=0 meters
+        # Gear: du=-15, dv=-405 pixels -> dx=0.83, dy=0.03 meters
+
+        # From green box (vertical movement in image):
+        # dv = 240 - 500 = -260 pixels (up in image)
+        # dx = 0.5 - 0 = 0.5 meters (positive x, which is up)
+        # scale_x = 0.5 / 260 = 0.00192 m/pixel
+
+        # From gear (horizontal AND vertical movement):
+        # du = 305 - 320 = -15 pixels (left in image)
+        # dy = 0.03 - 0 = 0.03 meters (positive y, which is left)
+        # scale_y = 0.03 / 15 = 0.002 m/pixel
+
+        dv_green = 240 - 500  # -260 pixels (up in image)
+        dx_green = 0.5 - 0     # 0.5 meters (positive x in world)
+
+        du_gear = 305 - 320   # -15 pixels (left in image)
+        dy_gear = 0.03 - 0    # 0.03 meters (positive y in world)
+
+        self.scale_x = abs(dx_green / dv_green)  # 0.5/260 = 0.00192 m/pixel
+        self.scale_y = abs(dy_gear / du_gear)    # 0.03/15 = 0.002 m/pixel
+
+        # Depth calibration: Store reference depth for z-coordinate conversion
+        # At calibration points, z should be 0.8m (table height)
+        # We'll measure the actual depth sensor reading and use it as reference
+        self.z_table = 0.8  # World z-coordinate of table surface
+        self.depth_reference = None  # Will be set from first depth reading at calibration point
+
+        self.get_logger().info(f'Pixel-to-world calibration: scale_x={self.scale_x:.6f} m/px, scale_y={self.scale_y:.6f} m/px')
+        self.get_logger().info(f'Origin: pixel({self.u_origin}, {self.v_origin}) -> world(0, 0, 0.8)')
+        self.get_logger().info(f'Coordinate mapping: u right=-y, v down=-x')
+        self.get_logger().info(f'Calibrated from green box at (320,240)->(0.5,0,0.8) and gear at (305,95)->(0.83,0.03,0.8)')
+        self.get_logger().info(f'Validation point: drill at (466,160)->(0.572,-0.241,0.832)')
+        self.get_logger().info(f'Validation point: monkey_wrench at (150,200)->(0.624,0.373,0.807)')
+        self.get_logger().info(f'Depth calibration: Call service at (320,240) to set depth reference for z=0.8m')
+        self.get_logger().info(f'RGB topic: {self.rgb_topic}')
+        self.get_logger().info(f'Depth topic: {self.depth_topic}')
+        self.get_logger().info(f'Camera info topic: {self.camera_info_topic}')
+        self.get_logger().info(f'real_hardware parameter: {self.real_hardware}')
+
+        # Store calibration validation points for accuracy checking
+        self.validation_points = [
+            {"name": "green_box", "pixel": (320, 240), "world": (0.5, 0.0, 0.8)},
+            {"name": "gear", "pixel": (305, 95), "world": (0.83, 0.03, 0.8)},
+            {"name": "drill", "pixel": (466, 160), "world": (0.571546, -0.240961, 0.831898)},
+            {"name": "monkey_wrench", "pixel": (150, 200), "world": (0.623673, 0.372909, 0.806652)},
+            {"name": "origin", "pixel": (320, 500), "world": (0.0, 0.0, 0.8)}
+        ]
+
+        # TF
+        self.tf_buffer = tf2_ros.Buffer()
+        self.tf_listener = tf2_ros.TransformListener(self.tf_buffer, self)
+
+        # Create service
         if PixelToReal is not None:
-            self.srv = self.create_service(
-                PixelToReal, '/pixel_to_real', self.handle_pixel_to_real
-            )
-            self.get_logger().info('Service /pixel_to_real ready')
+            self.srv = self.create_service(PixelToReal, 'pixel_to_real', self.handle_pixel_to_real)
+            self.get_logger().info('Service /pixel_to_real ready (custom_interfaces.srv.PixelToReal)')
+            self.get_logger().info('Usage: ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 320, v: 240}"')
         else:
-            self.get_logger().error(
-                'PixelToReal srv not found – build custom_interfaces first.'
-            )
+            self.get_logger().error('PixelToReal srv type not found!')
+            self.get_logger().error('Build custom_interfaces: colcon build --packages-select custom_interfaces')
             raise RuntimeError('custom_interfaces.srv.PixelToReal not available')
 
-        self.get_logger().info(
-            f't_base_cam = {self.t_base_cam.tolist()}   '
-            f'real_hardware={self.real_hardware}'
-        )
-
-    # ── Callbacks ─────────────────────────────────────────────────────────────
-
     def rgb_cb(self, msg: Image):
+        """Store the latest RGB image for pixel coordinate validation."""
         try:
-            self.latest_rgb = self.bridge.imgmsg_to_cv2(msg, 'bgr8')
+            rgb_img = self.bridge.imgmsg_to_cv2(msg, desired_encoding=self.color_encoding)
+            self.latest_rgb = rgb_img
+            self.latest_rgb_header = msg.header
         except Exception as e:
-            self.get_logger().error(f'RGB convert error: {e}')
+            self.get_logger().error(f"Failed to convert RGB image: {e}")
 
     def depth_cb(self, msg: Image):
+        # Support 32FC1 and 16UC1 encodings; convert to float32 meters.
         try:
-            if msg.encoding in ('16UC1', '16U'):
-                raw = self.bridge.imgmsg_to_cv2(msg, 'passthrough')
-                self.latest_depth = raw.astype(np.float32) * self.depth_scale
-            elif msg.encoding in ('32FC1', '32F'):
-                self.latest_depth = self.bridge.imgmsg_to_cv2(
-                    msg, 'passthrough'
-                ).astype(np.float32)
+            if msg.encoding == '32FC1' or msg.encoding == '32F':
+                depth_img = self.bridge.imgmsg_to_cv2(msg, desired_encoding=self.depth_32_encoding)
+                depth = depth_img.astype(np.float32)
+            elif msg.encoding == '16UC1' or msg.encoding == '16U':
+                d16 = self.bridge.imgmsg_to_cv2(msg, desired_encoding=self.depth_16_encoding)
+                depth = d16.astype(np.float32) / 1000.0  # assume mm -> m
             else:
-                raw = self.bridge.imgmsg_to_cv2(msg, 'passthrough')
-                self.latest_depth = raw.astype(np.float32)
+                # Try a generic conversion to float32
+                depth_img = self.bridge.imgmsg_to_cv2(msg, desired_encoding='passthrough')
+                depth = depth_img.astype(np.float32)
+
+            self.latest_depth = depth
+            self.latest_depth_header = msg.header
         except Exception as e:
-            self.get_logger().error(f'Depth convert error: {e}')
+            self.get_logger().error(f"Failed to convert depth image: {e}")
 
     def info_cb(self, msg: CameraInfo):
-        self.cam_model.fromCameraInfo(msg)
-        self.camera_ready = True
+        self.camera_info = msg
 
-    # ── Depth reading ──────────────────────────────────────────────────────────
+    def pixel_to_world_calibrated(self, u: int, v: int, depth_m: float):
+        """Convert pixel (u,v) to world coordinates (x,y,z) using calibration.
 
-    def get_robust_depth(self, u: int, v: int, window: int = 5) -> float | None:
-        """Median depth over a small window; returns None if no valid pixels."""
-        if self.latest_depth is None:
-            return None
-        h, w = self.latest_depth.shape
-        half = window // 2
-        u0, u1 = max(u - half, 0), min(u + half + 1, w)
-        v0, v1 = max(v - half, 0), min(v + half + 1, h)
-        patch = self.latest_depth[v0:v1, u0:u1]
-        valid = patch[np.isfinite(patch) & (patch > 0.0)]
-        return float(np.median(valid)) if len(valid) > 0 else None
-
-    # ── Conversion methods ─────────────────────────────────────────────────────
-
-    def _intrinsic_estimate(self, u: int, v: int, Z: float) -> np.ndarray:
-        """METHOD 1: pinhole back-projection + rigid-body transform to base.
-
-        ray = cam_model.projectPixelTo3dRay((u, v))  [unit vector in cam frame]
-        p_cam = ray * Z                               [scale to depth]
-        p_base = R @ p_cam + t                        [transform to base frame]
+        Coordinate system:
+        - u increases right -> y DECREASES (u represents -y direction)
+        - v increases down -> x DECREASES (v represents -x direction)
+        - Origin at pixel (320, 500) = world (0, 0, 0.8)
+        - Simulation: depth is inversely related to z (small depth = high z); real hardware returns depth_m as z
+
+        Args:
+            u: pixel column (positive right)
+            v: pixel row (positive down)
+            depth_m: depth in meters from camera (from depth sensor)
+
+        Returns:
+            (x, y, z) in world coordinates (meters)
         """
-        if not self.camera_ready:
-            # Fallback: hardcoded D435i intrinsics
-            fx, fy, cx, cy = 615.0, 615.0, 320.0, 240.0
-            ray = np.array([(u - cx) / fx, (v - cy) / fy, 1.0])
+        # Calculate pixel offset from origin
+        du = u - self.u_origin  # positive = right in image
+        dv = v - self.v_origin  # positive = down in image
+
+        # Apply transformation based on coordinate mapping:
+        # v down (-dv up) -> x increases: x = -dv * scale_x
+        # u right (-du left) -> y increases: y = -du * scale_y
+        x = -dv * self.scale_x  # Up in image -> positive x
+        y = -du * self.scale_y  # Left in image -> positive y
+
+        # Optional y-offset for robot reference frame (currently disabled):
+        # y = y - 0.5442  # Shift y by -0.5442 meters
+
+        # Convert depth to z-coordinate
+        # Real hardware: z is the raw depth reading, with no table-height conversion.
+        # Simulation: depth is inversely related to z (smaller depth = higher above the table),
+        # so z = z_table + (depth_reference - depth); the first reading becomes depth_reference.
+        if self.real_hardware:
+            z = depth_m  # Direct mapping for hardware
+        elif self.depth_reference is not None:
+            # z = z_table + (depth_reference - depth)
+            # When depth < depth_reference (closer to camera), z increases
+            # When depth > depth_reference (further from camera), z decreases
+            z = self.z_table + (self.depth_reference - depth_m)
         else:
-            ray = np.array(self.cam_model.projectPixelTo3dRay((u, v)))
-
-        p_cam  = ray * Z
-        p_base = self.R_base_cam @ p_cam + self.t_base_cam
-        return p_base
-
-    def _empirical_estimate(self, u: int, v: int) -> np.ndarray:
-        """METHOD 2: simple linear model fitted from calibration data."""
-        feat = np.array([1.0, float(u), float(v)])
-        x = float(np.dot(self._emp_ax, feat))
-        y = float(np.dot(self._emp_ay, feat))
-        return np.array([x, y, self._emp_z])
-
-    def _hybrid_estimate(
-        self,
-        u: int, v: int,
-        p_intrinsic: np.ndarray,
-        p_empirical: np.ndarray,
-    ) -> tuple[np.ndarray, float, float]:
-        """HYBRID: Gaussian-weighted blend.
-
-        Empirical weight is highest at the image centre (calibration region)
-        and decays towards the edges; intrinsic picks up the slack.
+            # First call: assume this is close to table depth, set reference
+            self.depth_reference = depth_m
+            self.get_logger().info(f'Set depth reference: {self.depth_reference:.3f}m at z={self.z_table}m')
+            z = self.z_table
+
+        return (x, y, z)
+
+    def read_depth_at(self, u: float, v: float, max_search: int = 5):
+        """Return the median of the valid bilinear depth samples around pixel (u, v).
+        Returns depth in meters; falls back to 0.8 m (assumed table depth) when nothing valid can be read.
+
+        Handles invalid depth (NaN/zero/inf) common on reflective surfaces or sensor noise
+        by sampling every offset within +/-max_search pixels (default 5) and taking the median of valid values.
+
+        The depth sensor returns distance from camera. We assume the table surface
+        is at 0.8m from the camera, which should be the largest/most common depth value.
         """
-        uc, vc = self._image_center
-        dist   = math.sqrt((u - uc) ** 2 + (v - vc) ** 2)
-        sigma  = math.sqrt(uc ** 2 + vc ** 2) * self._blend_sigma_frac  # ~σ in pixels
-
-        w_emp  = math.exp(-dist / sigma)
-        w_int  = 1.0 - w_emp
-
-        p_hybrid = w_emp * p_empirical + w_int * p_intrinsic
-        return p_hybrid, w_emp, w_int
-
-    # ── Service handler ────────────────────────────────────────────────────────
-
-    def handle_pixel_to_real(self, request, response):
-        u = int(request.u)
-        v = int(request.v)
-
-        # ── Depth ─────────────────────────────────────────────────────────────
-        Z = self.get_robust_depth(u, v)
-        if Z is None:
-            self.get_logger().warn(f'No valid depth at ({u},{v}), using 0.8 m fallback.')
-            Z = 0.8   # fallback to estimated table depth
-
-        # ── Compute both estimates ────────────────────────────────────────────
-        p_int = self._intrinsic_estimate(u, v, Z)
-        p_emp = self._empirical_estimate(u, v)
-
-        # ── Blend ─────────────────────────────────────────────────────────────
-        p_hybrid, w_emp, w_int = self._hybrid_estimate(u, v, p_int, p_emp)
-
-        response.x = float(p_hybrid[0])
-        response.y = float(p_hybrid[1])
-        response.z = float(p_hybrid[2])
-
-        self.get_logger().info(
-            f'Pixel ({u},{v}) depth={Z:.3f}m | '
-            f'Intrinsic=[{p_int[0]:.4f},{p_int[1]:.4f},{p_int[2]:.4f}] '
-            f'Empirical=[{p_emp[0]:.4f},{p_emp[1]:.4f}] '
-            f'Hybrid=[{p_hybrid[0]:.4f},{p_hybrid[1]:.4f},{p_hybrid[2]:.4f}] '
-            f'(w_emp={w_emp:.3f} w_int={w_int:.3f})'
-        )
-
-        # ── Debug image ───────────────────────────────────────────────────────
-        self._publish_debug(u, v, p_hybrid, Z)
-
-        return response
-
-    def _publish_debug(self, u: int, v: int, p: np.ndarray, depth: float):
-        if self.latest_rgb is None:
-            return
-        img = self.latest_rgb.copy()
-        cv2.drawMarker(img, (u, v), (0, 0, 255), cv2.MARKER_CROSS, 40, 3)
-        cv2.circle(img, (u, v), 20, (0, 255, 0), 2)
-        cv2.putText(img, f'Pixel: ({u},{v})',
-                    (u + 25, v - 45), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 255), 2)
-        cv2.putText(img, f'World: ({p[0]:.3f},{p[1]:.3f},{p[2]:.3f})m',
-                    (u + 25, v - 20), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (255, 0, 255), 2)
-        cv2.putText(img, f'Depth: {depth:.3f}m',
-                    (u + 25, v + 5), cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 255), 2)
-        uc, vc = self._image_center
-        cv2.drawMarker(img, (uc, vc), (255, 255, 0), cv2.MARKER_TILTED_CROSS, 30, 2)
-        try:
-            msg = self.bridge.cv2_to_imgmsg(img, encoding='bgr8')
-            msg.header.stamp = self.get_clock().now().to_msg()
-            self.debug_pub.publish(msg)
-        except Exception as e:
-            self.get_logger().error(f'Debug publish error: {e}')
+        if self.latest_depth is None:
+            self.get_logger().warn('No depth image available, using default table depth 0.8m')
+            return 0.8  # Default table depth
+
+        depth = self.latest_depth
+        h, w = depth.shape[:2]
+        if not (0 <= int(v) < h and 0 <= int(u) < w):
+            return 0.8  # Default if out of bounds
+
+        def bilinear(u_, v_):
+            x0 = int(math.floor(u_)); x1 = min(x0 + 1, w - 1)
+            y0 = int(math.floor(v_)); y1 = min(y0 + 1, h - 1)
+            wa = (x1 - u_) * (y1 - v_)
+            wb = (u_ - x0) * (y1 - v_)
+            wc = (x1 - u_) * (v_ - y0)
+            wd = (u_ - x0) * (v_ - y0)
+            d00 = float(depth[y0, x0]); d10 = float(depth[y0, x1])
+            d01 = float(depth[y1, x0]); d11 = float(depth[y1, x1])
+            d = wa * d00 + wb * d10 + wc * d01 + wd * d11
+            if np.isnan(d) or d <= 0.0 or np.isinf(d):
+                return None
+            return float(d)
+
+
+        #ros2 service call /pixel_to_real custom_interfaces/srv/PixelToReal "{u: 220, v: 220}"
+        # Use topic-based depth reading for both hardware and simulation
+        if self.latest_depth is not None:
+            d = self.latest_depth[int(v), int(u)]
+            self.get_logger().info(f'Read depth at ({u},{v}): {d:.3f}m from topic')
+        else:
+                    self.get_logger().warn('No depth data available, using default 0.8m')
+                    return 0.8
+
+
+
+
+
+
+
+
+        # Collect valid depths in the neighborhood and take the median (the direct read above is only logged)
+        valid_depths = []
+        for du in range(-max_search, max_search + 1):
+            for dv in range(-max_search, max_search + 1):
+                uu = u + du
+                vv = v + dv
+                if 0 <= int(uu) < w and 0 <= int(vv) < h:
+                    d_val = bilinear(uu, vv)
+                    if d_val is not None:
+                        valid_depths.append(d_val)
+
+        if len(valid_depths) == 0:
+            self.get_logger().warn(f'No valid depth found within {max_search}px of ({u:.1f},{v:.1f}), using table depth 0.8m')
+            return 0.8  # Default table depth
+
+        # Use median to be robust against outliers
+        median_depth = float(np.median(valid_depths))
+        return median_depth
+
+    def backproject(self, u: float, v: float, d: float):
+        # Use camera_info intrinsics
+        K = self.camera_info.k
+        fx = K[0]; fy = K[4]; cx = K[2]; cy = K[5]
+        x_c = (u - cx) * d / fx
+        y_c = (v - cy) * d / fy
+        z_c = d
+        return np.array([x_c, y_c, z_c], dtype=np.float64)
+
+    def handle_pixel_to_real(self, req, resp):
+        """Handle pixel to real coordinate conversion service request."""
+        # Get pixel coordinates from request (int32 fields)
+        u = int(req.u)
+        v = int(req.v)
+
+        # Get depth at this pixel (default to table depth 0.8m)
+        depth_m = self.read_depth_at(float(u), float(v))
+
+        # Convert pixel to world coordinates using calibration
+        x_w, y_w, z_w = self.pixel_to_world_calibrated(u, v, depth_m)
+
+        # DEBUG: Visualize the pixel location and world coordinates on the image
+        if self.latest_rgb is not None:
+            debug_img = self.latest_rgb.copy()
+
+            # Draw a large crosshair at the requested pixel
+            cv2.drawMarker(debug_img, (u, v), (0, 0, 255), cv2.MARKER_CROSS, 40, 3)
+
+            # Draw a circle around it
+            cv2.circle(debug_img, (u, v), 20, (0, 255, 0), 2)
+
+            # Add text label with pixel coordinates
+            label_pixel = f"Pixel: ({u}, {v})"
+            cv2.putText(debug_img, label_pixel, (u + 25, v - 45),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 0, 255), 2)
+
+            # Add text label with world coordinates
+            label_world = f"World: ({x_w:.3f}, {y_w:.3f}, {z_w:.3f})m"
+            cv2.putText(debug_img, label_world, (u + 25, v - 20),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, (255, 0, 255), 2)
+
+            # Add depth label
+            label_depth = f"Depth: {depth_m:.3f}m"
+            cv2.putText(debug_img, label_depth, (u + 25, v + 5),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 255), 2)
+
+            # Draw origin marker at (320, 500)
+            origin_u, origin_v = self.u_origin, self.v_origin
+            if 0 <= origin_u < debug_img.shape[1] and 0 <= origin_v < debug_img.shape[0]:
+                cv2.drawMarker(debug_img, (origin_u, origin_v), (255, 255, 0),
+                             cv2.MARKER_TILTED_CROSS, 30, 2)
+                cv2.putText(debug_img, "Origin (0,0)", (origin_u + 10, origin_v - 10),
+                           cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 0), 2)
+
+            # Draw coordinate axes for reference
+            cv2.putText(debug_img, "u -> (right)", (10, 30),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 0, 0), 2)
+            cv2.putText(debug_img, "v", (10, 55),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
+            cv2.putText(debug_img, "|", (10, 68),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
+            cv2.putText(debug_img, "v (down)", (10, 85),
+                       cv2.FONT_HERSHEY_SIMPLEX, 0.5, (0, 255, 0), 2)
+
+            # Publish debug image
+            try:
+                debug_msg = self.bridge.cv2_to_imgmsg(debug_img, encoding='bgr8')
+                debug_msg.header.stamp = self.get_clock().now().to_msg()
+                debug_msg.header.frame_id = 'camera_link'
+                self.debug_pub.publish(debug_msg)
+                self.get_logger().info(f'Published debug image for pixel ({u}, {v})')
+            except Exception as e:
+                self.get_logger().error(f'Failed to publish debug image: {e}')
+
+        # Validate pixel coordinates against RGB image dimensions
+        if self.latest_rgb is not None:
+            rgb_h, rgb_w = self.latest_rgb.shape[:2]
+            if not (0 <= u < rgb_w and 0 <= v < rgb_h):
+                self.get_logger().error(f'Pixel ({u},{v}) out of RGB image bounds ({rgb_w}x{rgb_h})')
+                # Return zero coordinates for out of bounds
+                resp.x = 0.0
+                resp.y = 0.0
+                resp.z = 0.0
+                return resp
+
+        # Fill response (float64 fields)
+        resp.x = float(x_w)
+        resp.y = float(y_w)
+        resp.z = float(z_w)
+
+        # Check if this is a known calibration point and log the error
+        for calib_point in self.validation_points:
+            if abs(u - calib_point["pixel"][0]) <= 1 and abs(v - calib_point["pixel"][1]) <= 1:
+                expected = calib_point["world"]
+                error_x = x_w - expected[0]
+                error_y = y_w - expected[1]
+                error_z = z_w - expected[2]
+                error_dist = np.sqrt(error_x**2 + error_y**2 + error_z**2)
+
+                self.get_logger().info(
+                    f'Validation point "{calib_point["name"]}" at pixel ({u},{v}): '
+                    f'Calculated ({x_w:.3f}, {y_w:.3f}, {z_w:.3f}), '
+                    f'Expected ({expected[0]:.3f}, {expected[1]:.3f}, {expected[2]:.3f}), '
+                    f'Error: dx={error_x:.3f}m, dy={error_y:.3f}m, dz={error_z:.3f}m, dist={error_dist:.3f}m'
+                )
+                break
+
+        self.get_logger().info(f'Pixel ({u},{v}) -> World ({x_w:.3f}m, {y_w:.3f}m, {z_w:.3f}m)')
+        return resp
 
 
 def main(args=None):
diff --git a/vision/pixel_to_real_world.py b/vision/pixel_to_real_world.py
index 10dab48..747b10f 100644
--- a/vision/pixel_to_real_world.py
+++ b/vision/pixel_to_real_world.py
@@ -8,6 +8,7 @@
 from cv_bridge import CvBridge
 from image_geometry import PinholeCameraModel
 import numpy as np
+import math
 
 
 class PixelToRealNode(Node):
@@ -64,7 +65,22 @@ def __init__(self):
             [0.0,  0.0, -1.0]
         ])
 
-        self.get_logger().info("PixelToReal with TF ready.")
+        # ---- METHOD 2: Empirical linear model ----
+        # Least-squares fit on 22 calibration points (5 measures × 2 colours
+        # × TR/BL), 2026-03-12.  Model:  x = a0 + a1*u + a2*v
+        #                                y = b0 + b1*u + b2*v
+        # 2D RMSE = 20.8 mm  (x: 12.1 mm, y: 16.9 mm)
+        self._emp_ax = np.array([-0.56859693, +0.00130317, +0.00002114])  # [1,u,v]→x
+        self._emp_ay = np.array([+0.98011251, -0.00002728, -0.00133088])  # [1,u,v]→y
+        self._emp_z  = 0   # table height (m)
+
+        # ---- Hybrid blend parameters ----
+        # Empirical is most accurate near image centre (calibration region).
+        # The weight exp(-dist/σ) controls how quickly we trust intrinsics at the edges.
+        self._image_center     = (320, 240)   # (u_c, v_c)
+        self._blend_sigma_frac = 0.6          # σ = this × sqrt(u_c² + v_c²)
+
+        self.get_logger().info("PixelToReal with empirical + intrinsic hybrid ready.")
 
     # --------------------------------------------------
 
@@ -97,6 +113,49 @@ def get_robust_depth(self, u, v, window_size=5):
 
     # --------------------------------------------------
 
+    def _intrinsic_estimate(self, u: int, v: int, Z: float) -> np.ndarray:
+        """METHOD 1: pinhole back-projection to z-depth Z + rigid-body transform to base."""
+        ray = self.cam_model.projectPixelTo3dRay((u, v))
+        p_cam = np.array(ray) * (Z / ray[2])  # rescale so camera-frame z == Z for any ray normalisation
+        p_base = self.R_base_cam @ p_cam + self.t_base_cam
+        return p_base
+
+    def _empirical_estimate(self, u: int, v: int) -> np.ndarray:
+        """METHOD 2: simple linear model fitted from calibration data.
+
+        Least-squares fit on 22 calibration points, 2026-03-12:
+          x = -0.56859693 + 0.00130317*u + 0.00002114*v   (RMS 12.1 mm)
+          y =  0.98011251 - 0.00002728*u - 0.00133088*v   (RMS 16.9 mm)
+          2D RMSE = 20.8 mm
+        """
+        feat = np.array([1.0, float(u), float(v)])  # [1, u, v], matching the coefficient order
+        x = float(np.dot(self._emp_ax, feat))
+        y = float(np.dot(self._emp_ay, feat))
+        return np.array([x, y, self._emp_z])  # z is the constant self._emp_z; depth is not an input
+
+    def _hybrid_estimate(
+        self,
+        u: int, v: int,
+        p_intrinsic: np.ndarray,
+        p_empirical: np.ndarray,
+    ) -> tuple:
+        """HYBRID: distance-weighted blend; returns (p_hybrid, w_emp, w_int).
+
+        Empirical weight is 1 at the image centre (calibration region) and
+        decays as exp(-dist/sigma) towards the edges; intrinsic gets 1 - w_emp.
+        """
+        uc, vc = self._image_center
+        dist  = math.sqrt((u - uc) ** 2 + (v - vc) ** 2)  # pixel distance from the image centre
+        sigma = math.sqrt(uc ** 2 + vc ** 2) * self._blend_sigma_frac  # |(uc, vc)| scaled by the fraction
+
+        w_emp = math.exp(-dist / sigma)  # NOTE: exponential in dist, not a Gaussian (no dist² term)
+        w_int = 1.0 - w_emp
+
+        p_hybrid = w_emp * p_empirical + w_int * p_intrinsic  # same weights applied to x, y and z
+        return p_hybrid, w_emp, w_int
+
+    # --------------------------------------------------
+
     def handle_pixel_to_real(self, request, response):
 
         if self.depth_image is None or not self.camera_ready:
@@ -113,21 +172,26 @@ def handle_pixel_to_real(self, request, response):
 
         Z = float(depth_raw) * self.depth_scale
 
-        # Camera frame 3D
-        ray = self.cam_model.projectPixelTo3dRay((u, v))
+        # METHOD 1: intrinsic back-projection
+        p_int = self._intrinsic_estimate(u, v, Z)
 
-        X_cam = ray[0] * Z
-        Y_cam = ray[1] * Z
-        Z_cam = Z
+        # METHOD 2: empirical linear model
+        p_emp = self._empirical_estimate(u, v)
 
-        p_cam = np.array([X_cam, Y_cam, Z_cam])
+        # HYBRID: distance-weighted blend (w_emp = exp(-dist/σ))
+        p_hybrid, w_emp, w_int = self._hybrid_estimate(u, v, p_int, p_emp)
 
-        # Transform to base frame
-        p_base = self.R_base_cam @ p_cam + self.t_base_cam
+        response.x = float(p_hybrid[0])
+        response.y = float(p_hybrid[1])
+        response.z = float(p_hybrid[2])
 
-        response.x = float(p_base[0])
-        response.y = float(p_base[1])
-        response.z = float(p_base[2])
+        self.get_logger().info(
+            f'Pixel ({u},{v}) depth={Z:.3f}m | '
+            f'Intrinsic=[{p_int[0]:.4f},{p_int[1]:.4f},{p_int[2]:.4f}] '
+            f'Empirical=[{p_emp[0]:.4f},{p_emp[1]:.4f}] '
+            f'Hybrid=[{p_hybrid[0]:.4f},{p_hybrid[1]:.4f},{p_hybrid[2]:.4f}] '
+            f'(w_emp={w_emp:.3f} w_int={w_int:.3f})'
+        )
 
         return response
 
@@ -141,4 +205,4 @@ def main(args=None):
 
 
 if __name__ == "__main__":
-    main()
\ No newline at end of file
+    main()

From f646fff6eb03316da233eb2501007e040aed8c3a Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Fri, 10 Apr 2026 02:15:32 +0700
Subject: [PATCH 11/16] feat: add benchmark branch

---
 vision/pixel_to_real.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/vision/pixel_to_real.py b/vision/pixel_to_real.py
index dc5d75a..21eec56 100644
--- a/vision/pixel_to_real.py
+++ b/vision/pixel_to_real.py
@@ -508,3 +508,4 @@ def main(args=None):
 
 if __name__ == '__main__':
     main()
+

From e33e24483000b19fc594cab5a912d74cb424c05f Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Fri, 10 Apr 2026 05:59:23 +0700
Subject: [PATCH 12/16] feat: develop a working dashboard for benchmark SAM

---
 launch/vision.launch.py                    |   9 +
 setup.py                                   |   2 +-
 vision/benchmark_dashboard.py              |  64 ++--
 vision/simple_sam_detector.py              | 106 ++++-
 vision_scripts/test_dashboard_data_flow.py | 426 +++++++++++++++++++++
 5 files changed, 582 insertions(+), 25 deletions(-)
 create mode 100644 vision_scripts/test_dashboard_data_flow.py

diff --git a/launch/vision.launch.py b/launch/vision.launch.py
index 21011ad..6d6119c 100644
--- a/launch/vision.launch.py
+++ b/launch/vision.launch.py
@@ -42,4 +42,13 @@ def generate_launch_description():
     )
     ld.add_action(scene_understanding_node)
 
+    benchmark_dashboard_node = Node(
+        package='vision',
+        executable='benchmark_dashboard',
+        name='benchmark_dashboard_node',
+        output='screen',
+        emulate_tty=True
+    )
+    ld.add_action(benchmark_dashboard_node)
+
     return ld
diff --git a/setup.py b/setup.py
index 569de07..c221795 100644
--- a/setup.py
+++ b/setup.py
@@ -76,7 +76,7 @@
             'find_boundary_service = vision.find_boundary_service_node:main',
             'find_multi_object = vision.find_multi_object:main',
             # 'calibrate = calibration.calibrate:main',
-            # 'benchmark_dashboard = vision.benchmark_dashboard:main',
+             'benchmark_dashboard = vision.benchmark_dashboard:main',
             # 'show_rgb_image = vision.show_rgb_image_node:main',
             # 'show_depth_image = vision.show_depth_image_node:main',
             # 'sam_vision_pipeline = vision.sam_vision_pipeline_node:main',
diff --git a/vision/benchmark_dashboard.py b/vision/benchmark_dashboard.py
index 552365c..beca947 100644
--- a/vision/benchmark_dashboard.py
+++ b/vision/benchmark_dashboard.py
@@ -25,6 +25,7 @@
 from std_srvs.srv import Trigger
 from std_msgs.msg import String
 import json
+import numpy as np
 import time
 from datetime import datetime
 from http.server import HTTPServer, SimpleHTTPRequestHandler
@@ -45,6 +46,18 @@
     print("Custom interfaces not available. Build custom_interfaces package first.")
 
 
+class _ROSJSONEncoder(json.JSONEncoder):
+    """JSON encoder that converts numpy bool/integer/float scalars and arrays to native types."""
+    def default(self, obj):
+        if isinstance(obj, np.bool_):  # not an np.integer subclass, so it needs its own branch
+            return bool(obj)
+        if isinstance(obj, np.integer):
+            return int(obj)
+        if isinstance(obj, np.floating):
+            return float(obj)
+        return obj.tolist() if isinstance(obj, np.ndarray) else super().default(obj)
+
+
 class BenchmarkDashboard(Node):
     """
     Benchmark Dashboard - Monitors vision services and provides web interface
@@ -152,20 +165,20 @@ def sam_detections_callback(self, msg):
                 'frame_id': msg.header.frame_id,
                 'obj_id': detection.object_id,
                 'bbox': {
-                    'x1': detection.bbox[0],
-                    'y1': detection.bbox[1],
-                    'x2': detection.bbox[2],
-                    'y2': detection.bbox[3]
+                    'x1': int(detection.bbox[0]),
+                    'y1': int(detection.bbox[1]),
+                    'x2': int(detection.bbox[2]),
+                    'y2': int(detection.bbox[3])
                 },
                 'center': {
-                    'u': detection.center[0],
-                    'v': detection.center[1]
+                    'u': int(detection.center[0]),
+                    'v': int(detection.center[1])
                 },
                 'confidence': float(detection.confidence),
-                'area': detection.area,
+                'area': int(detection.area),
                 'distance_cm': float(detection.distance_cm),
                 'iou_score': float(detection.iou_score),
-                'is_stable': detection.is_stable_detection,
+                'is_stable': bool(detection.is_stable_detection),
                 'ap_iou_threshold': 0.5 if detection.is_stable_detection else 0.0
             }
             
@@ -193,10 +206,10 @@ def scene_understanding_callback(self, msg):
         scene_data = {
             'timestamp': timestamp,
             'scene_id': msg.scene_id,
-            'total_objects': msg.total_objects,
+            'total_objects': int(msg.total_objects),
             'relations': relations,
             'object_labels': list(msg.object_labels),
-            'object_counts': list(msg.object_counts),
+            'object_counts': [int(c) for c in msg.object_counts],
             'graspable_objects': msg.graspable_objects,
             'average_distance_cm': float(msg.average_distance_cm),
             'scene_description': msg.scene_description,
@@ -276,10 +289,10 @@ def add_grasp_detection_record(self, grasp_pose):
             'timestamp': timestamp,
             'test_id': len(self.data['grasp_detections']) + 1,
             'object_id': grasp_pose.object_id,
-            'bbox': list(grasp_pose.bbox),
+            'bbox': [int(v) for v in grasp_pose.bbox],
             'pixel_position': {
-                'u': grasp_pose.bbox[0] + (grasp_pose.bbox[2] - grasp_pose.bbox[0]) // 2,
-                'v': grasp_pose.bbox[1] + (grasp_pose.bbox[3] - grasp_pose.bbox[1]) // 2
+                'u': int(grasp_pose.bbox[0]) + (int(grasp_pose.bbox[2]) - int(grasp_pose.bbox[0])) // 2,
+                'v': int(grasp_pose.bbox[1]) + (int(grasp_pose.bbox[3]) - int(grasp_pose.bbox[1])) // 2
             },
             'world_position': {
                 'x': float(grasp_pose.position.x),
@@ -302,7 +315,7 @@ def add_grasp_detection_record(self, grasp_pose):
     def publish_data(self):
         """Publish benchmark data to topic"""
         msg = String()
-        msg.data = json.dumps(self.data)
+        msg.data = json.dumps(self.data, cls=_ROSJSONEncoder)
         self.data_publisher.publish(msg)
     
     def clear_data_callback(self, request, response):
@@ -327,18 +340,25 @@ def clear_data_callback(self, request, response):
     
     def start_http_server(self):
         """Start HTTP server for dashboard"""
-        # Get the path to the HTML file
+        # Resolve dashboard HTML using ament share directory (correct for installed packages)
+        try:
+            from ament_index_python.packages import get_package_share_directory
+            share_dir = get_package_share_directory('vision')
+            html_dir = Path(share_dir) / 'dashboard'
+        except Exception:
+            html_dir = Path(__file__).parent.parent / 'dashboard'
+
+        # History JSON is written by simple_sam_detector next to the installed module
         package_path = Path(__file__).parent.parent
-        html_dir = package_path / 'dashboard'
-        
-        # Create dashboard directory if it doesn't exist
-        html_dir.mkdir(exist_ok=True)
-        
-        # Create HTML file if it doesn't exist
+
+        self.get_logger().info(f'Dashboard HTML dir: {html_dir}')
+
+        # Fallback: create default HTML if share dir has no index.html
         html_file = html_dir / 'index.html'
         if not html_file.exists():
             self.get_logger().warn(f'Dashboard HTML not found at {html_file}')
             self.get_logger().warn('Creating basic HTML file...')
+            html_dir.mkdir(exist_ok=True)
             self.create_default_html(html_file)
         
         # Custom handler that serves files from html_dir and provides data endpoint
@@ -354,7 +374,7 @@ def do_GET(self):
                     self.send_header('Content-type', 'application/json')
                     self.send_header('Access-Control-Allow-Origin', '*')
                     self.end_headers()
-                    data_json = json.dumps(self.dashboard_node.data)
+                    data_json = json.dumps(self.dashboard_node.data, cls=_ROSJSONEncoder)
                     self.wfile.write(data_json.encode())
                 elif self.path == '/api/run-history':
                     # Serve vision_runs_history.json from workspace root
diff --git a/vision/simple_sam_detector.py b/vision/simple_sam_detector.py
index 418fad7..b303d75 100755
--- a/vision/simple_sam_detector.py
+++ b/vision/simple_sam_detector.py
@@ -485,7 +485,15 @@ def detect_objects_callback(self, request, response):
                     f"conf={confidences[i]:.2f}, dist={distances_cm[i]:.1f}cm"
                 )
             self.get_logger().info("=" * 80)
-            
+
+            # Save results to vision_runs_history.json for real-time dashboard
+            end_inner = time.perf_counter()
+            self._save_detect_objects_run(
+                object_ids, bbox_x1, bbox_y1, bbox_x2, bbox_y2,
+                confidences, distances_cm, iou_scores, is_stable_array,
+                clip_classifications, end_inner - start
+            )
+
         except Exception as e:
             response.success = False
             response.total_detections = 0
@@ -509,9 +517,103 @@ def detect_objects_callback(self, request, response):
         end = time.perf_counter()
         latency = end - start
         self.get_logger().info(f"Total detection latency: {latency:.6f} seconds")
-        
+
         return response
 
+    def _save_detect_objects_run(self, object_ids, bbox_x1, bbox_y1, bbox_x2, bbox_y2,
+                                  confidences, distances_cm, iou_scores, is_stable_array,
+                                  clip_classifications, latency_s):  # NOTE: `confidences` is not read below
+        """Append this /vision/detect_objects run to vision_runs_history.json (best effort, never raises)."""
+        try:
+            from pathlib import Path
+
+            # Same path used by benchmark_dashboard and collect_and_export
+            package_path = Path(__file__).parent.parent
+            history_file = package_path / 'vision_runs_history.json'
+
+            # Load existing history
+            history = []
+            if history_file.exists():
+                try:
+                    with open(history_file, 'r') as f:
+                        data = json.load(f)
+                    if isinstance(data, list):
+                        history = data
+                except Exception as e:  # unreadable/corrupt file: start fresh, but say so
+                    self.get_logger().warn(f"Ignoring unreadable run history {history_file}: {e}")
+
+            last_run_no = history[-1]['meta']['run_no'] if history else 0
+            run_no = last_run_no + 1
+
+            num_dets = len(self.latest_detections)
+            total_sam_conf = 0.0
+            objects = []
+            for idx in range(num_dets):
+                det = self.latest_detections[idx]
+                clip_info = clip_classifications.get(idx, {})
+                sam_conf = float(det.get('confidence', 0.0))
+                total_sam_conf += sam_conf
+                objects.append({
+                    'object_id':      object_ids[idx] if idx < len(object_ids) else f'object_{idx}',
+                    'label':          clip_info.get('label', '') if clip_info else '',
+                    'bbox_x1':        bbox_x1[idx] if idx < len(bbox_x1) else 0,
+                    'bbox_y1':        bbox_y1[idx] if idx < len(bbox_y1) else 0,
+                    'bbox_x2':        bbox_x2[idx] if idx < len(bbox_x2) else 0,
+                    'bbox_y2':        bbox_y2[idx] if idx < len(bbox_y2) else 0,
+                    'sam_confidence': round(sam_conf, 4),
+                    'clip_confidence': round(float(clip_info.get('confidence', 0.0)), 4) if clip_info else '',
+                    'distance_cm':    distances_cm[idx] if idx < len(distances_cm) else '',
+                    'iou_score':      iou_scores[idx] if idx < len(iou_scores) else '',
+                    'is_stable':      is_stable_array[idx] if idx < len(is_stable_array) else '',
+                    'has_grasp':      False,
+                    'grasp':          {},
+                    'obb_angle_deg':  '', 'obb_theta_rad': '',
+                    'obb_width_px':   '', 'obb_height_px': '',
+                    'obb_center_u':   '', 'obb_center_v':  '',
+                })
+
+            avg_sam_conf = total_sam_conf / num_dets if num_dets > 0 else 0.0
+            avg_iou = sum(iou_scores) / len(iou_scores) if iou_scores else 0.0
+            stability_rate = sum(1 for s in is_stable_array if s) / len(is_stable_array) if is_stable_array else 0.0
+
+            run = {
+                'meta': {
+                    'run_no':    run_no,
+                    'timestamp': datetime.utcnow().isoformat() + 'Z',
+                    'latency_s': round(latency_s, 3),
+                    'source':    'detect_objects',
+                },
+                'sam': {
+                    'success':          True,
+                    'latency_s':        round(latency_s, 3),
+                    'total_detections': num_dets,
+                    'avg_confidence':   round(avg_sam_conf, 4),
+                    'average_iou':      round(avg_iou, 4),
+                    'stability_rate':   round(stability_rate, 4),
+                },
+                'clip': {
+                    'success':          bool(clip_classifications),
+                    'latency_s':        0.0,
+                    'filtered_regions': len(clip_classifications),
+                },
+                'scene': {'success': False, 'latency_s': 0.0},
+                'obb':   {'success': False, 'latency_s': 0.0},
+                'objects':   objects,
+                'relations': [],
+                'grasps':    [],
+            }
+
+            history.append(run)
+            history = history[-20:]  # keep last 20 runs
+
+            payload = json.dumps(history, indent=2)  # serialise first: a failure must not truncate the file
+            history_file.write_text(payload)
+
+            self.get_logger().info(f"Saved run #{run_no} to {history_file} ({num_dets} objects)")
+
+        except Exception as e:
+            self.get_logger().warn(f"Failed to save run history: {e}")
+
+
     def _startup_announce(self):
         """One-shot announce to make sure global topics appear after node startup."""
         try:
diff --git a/vision_scripts/test_dashboard_data_flow.py b/vision_scripts/test_dashboard_data_flow.py
new file mode 100644
index 0000000..dfc754b
--- /dev/null
+++ b/vision_scripts/test_dashboard_data_flow.py
@@ -0,0 +1,426 @@
+#!/usr/bin/env python3
+"""
+Unit test: verify detect_objects → vision_runs_history.json → dashboard data flow.
+
+Runs WITHOUT ROS2. Tests:
+  1. JSON file is written to the correct path
+  2. JSON schema matches exactly what dashboard HTML expects
+  3. /api/data live path (benchmark_dashboard SAM topic callback schema)
+  4. /api/run-history path (run history table schema)
+
+Usage:
+    python3 vision_scripts/test_dashboard_data_flow.py
+"""
+
+import json
+import os
+import sys
+import tempfile
+import traceback
+from pathlib import Path
+from datetime import datetime
+
+# ── Path setup ────────────────────────────────────────────────────────────────
+SCRIPT_DIR   = Path(__file__).resolve().parent
+PACKAGE_ROOT = SCRIPT_DIR.parent                          # src/vision/
+HISTORY_FILE = PACKAGE_ROOT / "vision_runs_history.json"
+
+PASS = "\033[92m[PASS]\033[0m"
+FAIL = "\033[91m[FAIL]\033[0m"
+INFO = "\033[94m[INFO]\033[0m"
+
+failures = []
+
+def check(name, condition, detail=""):  # print one PASS/FAIL line; failed names are recorded
+    if condition:
+        print(f"  {PASS}  {name}")
+    else:
+        print(f"  {FAIL}  {name}" + (f" — {detail}" if detail else ""))
+        failures.append(name)  # module-level list of failed check names
+
+
+# ── Fake detection data (mirrors what detect_objects_callback produces) ────────
+
+FAKE_DETECTIONS = [
+    {
+        "id":          "object_0",
+        "class_name":  "object_0",
+        "confidence":  0.82,
+        "bbox":        [100, 150, 300, 400],
+        "center":      [200, 275],
+        "area":        45000,
+        "distance_cm": 55.3,
+        "iou_score":   0.71,
+        "is_stable":   True,
+        "matched_prev_id": "",
+        "mask":        None,  # would be np array in real code
+    },
+    {
+        "id":          "object_1",
+        "class_name":  "object_1",
+        "confidence":  0.64,
+        "bbox":        [400, 200, 580, 450],
+        "center":      [490, 325],
+        "area":        34200,
+        "distance_cm": 72.1,
+        "iou_score":   0.0,
+        "is_stable":   False,
+        "matched_prev_id": "",
+        "mask":        None,
+    },
+]
+
+FAKE_CLIP = {
+    0: {"label": "cup",    "confidence": 0.91, "bbox": [100, 150, 300, 400]},
+    1: {"label": "bottle", "confidence": 0.78, "bbox": [400, 200, 580, 450]},
+}
+
+
+# ── Reproduce _save_detect_objects_run logic verbatim ─────────────────────────
+
+def simulate_save(latest_detections, clip_classifications, latency_s, history_file):
+    """Test-local mirror of _save_detect_objects_run (simple_sam_detector.py); returns (run, history)."""
+    history = []
+    if history_file.exists():
+        try:
+            with open(history_file, "r") as f:
+                data = json.load(f)
+            if isinstance(data, list):
+                history = data
+        except Exception:
+            pass  # unreadable or empty file: history stays [] and a fresh one is written
+
+    last_run_no = history[-1]["meta"]["run_no"] if history else 0
+    run_no = last_run_no + 1
+
+    # Build parallel arrays (same logic as detect_objects_callback)
+    object_ids    = []
+    bbox_x1, bbox_y1, bbox_x2, bbox_y2 = [], [], [], []
+    confidences   = []
+    distances_cm  = []
+    iou_scores    = []
+    is_stable_arr = []
+
+    for idx, det in enumerate(latest_detections):
+        clip_info = clip_classifications.get(idx)
+        if clip_info:
+            object_ids.append(f"{clip_info['label']}_{idx}")
+            confidences.append(float(clip_info["confidence"]))
+        else:
+            object_ids.append(det["id"])
+            confidences.append(float(det["confidence"]))
+
+        bbox = det["bbox"]
+        bbox_x1.append(bbox[0]); bbox_y1.append(bbox[1])
+        bbox_x2.append(bbox[2]); bbox_y2.append(bbox[3])
+        distances_cm.append(float(det.get("distance_cm", -1.0)))
+        iou_scores.append(float(det.get("iou_score", 0.0)))
+        is_stable_arr.append(bool(det.get("is_stable", False)))
+
+    num_dets = len(latest_detections)
+    total_sam_conf = 0.0
+    objects = []
+    for idx in range(num_dets):
+        det = latest_detections[idx]
+        clip_info = clip_classifications.get(idx, {})
+        sam_conf = float(det.get("confidence", 0.0))
+        total_sam_conf += sam_conf
+        objects.append({
+            "object_id":      object_ids[idx] if idx < len(object_ids) else f"object_{idx}",
+            "label":          clip_info.get("label", "") if clip_info else "",
+            "bbox_x1":        bbox_x1[idx] if idx < len(bbox_x1) else 0,
+            "bbox_y1":        bbox_y1[idx] if idx < len(bbox_y1) else 0,
+            "bbox_x2":        bbox_x2[idx] if idx < len(bbox_x2) else 0,
+            "bbox_y2":        bbox_y2[idx] if idx < len(bbox_y2) else 0,
+            "sam_confidence": round(sam_conf, 4),
+            "clip_confidence": round(float(clip_info.get("confidence", 0.0)), 4) if clip_info else "",
+            "distance_cm":    distances_cm[idx] if idx < len(distances_cm) else "",
+            "iou_score":      iou_scores[idx] if idx < len(iou_scores) else "",
+            "is_stable":      is_stable_arr[idx] if idx < len(is_stable_arr) else "",
+            "has_grasp":      False,
+            "grasp":          {},
+            "obb_angle_deg":  "", "obb_theta_rad": "",
+            "obb_width_px":   "", "obb_height_px": "",
+            "obb_center_u":   "", "obb_center_v":  "",
+        })
+
+    avg_sam_conf   = total_sam_conf / num_dets if num_dets > 0 else 0.0
+    avg_iou        = sum(iou_scores) / len(iou_scores) if iou_scores else 0.0
+    stability_rate = sum(1 for s in is_stable_arr if s) / len(is_stable_arr) if is_stable_arr else 0.0
+
+    run = {
+        "meta": {
+            "run_no":    run_no,
+            "timestamp": datetime.utcnow().isoformat() + "Z",
+            "latency_s": round(latency_s, 3),
+            "source":    "detect_objects",
+        },
+        "sam": {
+            "success":          True,
+            "latency_s":        round(latency_s, 3),
+            "total_detections": num_dets,
+            "avg_confidence":   round(avg_sam_conf, 4),
+            "average_iou":      round(avg_iou, 4),
+            "stability_rate":   round(stability_rate, 4),
+        },
+        "clip": {
+            "success":          bool(clip_classifications),
+            "latency_s":        0.0,
+            "filtered_regions": len(clip_classifications),
+        },
+        "scene": {"success": False, "latency_s": 0.0},
+        "obb":   {"success": False, "latency_s": 0.0},
+        "objects":   objects,
+        "relations": [],
+        "grasps":    [],
+    }
+
+    history.append(run)
+    history = history[-20:]  # only the 20 most recent runs are kept
+
+    with open(history_file, "w") as f:
+        json.dump(history, f, indent=2)
+
+    return run, history
+
+
+# ── Test 1: File is written ────────────────────────────────────────────────────
+
+def test_file_written():  # saves one run into a fresh temp file; returns (path, run, history)
+    print("\n── Test 1: File write ───────────────────────────────────────────")
+    with tempfile.NamedTemporaryFile(suffix=".json", delete=False) as tf:
+        tmp = Path(tf.name)
+    try:
+        run, history = simulate_save(FAKE_DETECTIONS, FAKE_CLIP, 1.23, tmp)
+        check("File created", tmp.exists() and tmp.stat().st_size > 0)  # temp file pre-exists, so require content
+        check("File is valid JSON", json.loads(tmp.read_text()) == history)  # re-read what was written
+        check("History is list", isinstance(history, list))
+        check("History has 1 entry", len(history) == 1)
+        check("run_no == 1", run["meta"]["run_no"] == 1)
+        print(f"  {INFO}  Written to: {tmp}")
+        return tmp, run, history
+    except Exception as e:
+        check("No exception during save", False, str(e))
+        traceback.print_exc()
+        return None, None, None
+    finally:
+        pass  # keep file for next test
+
+
+# ── Test 2: JSON schema matches /api/run-history dashboard expectations ────────
+
+def test_run_history_schema(run):  # checks one saved run dict for the fields listed below
+    print("\n── Test 2: /api/run-history schema ─────────────────────────────")
+    if run is None:
+        print("  Skipped (previous test failed)")
+        return
+
+    meta  = run.get("meta", {})
+    sam   = run.get("sam", {})
+    clip  = run.get("clip", {})
+    objs  = run.get("objects", [])
+
+    # meta fields (dashboard uses: run_no, timestamp, latency_s)
+    check("meta.run_no present",    "run_no"    in meta)
+    check("meta.timestamp present", "timestamp" in meta)
+    check("meta.latency_s present", "latency_s" in meta)
+
+    # sam fields (dashboard uses: total_detections, avg_confidence, average_iou, stability_rate, latency_s, success)
+    for field in ["total_detections", "avg_confidence", "average_iou", "stability_rate", "latency_s", "success"]:
+        check(f"sam.{field} present", field in sam)
+
+    # clip fields (dashboard uses: filtered_regions, latency_s, success)
+    for field in ["filtered_regions", "latency_s", "success"]:
+        check(f"clip.{field} present", field in clip)
+
+    # objects array
+    check("objects is list",        isinstance(objs, list))
+    check("objects not empty",      len(objs) == len(FAKE_DETECTIONS))
+
+    # per-object fields (dashboard uses all of these)
+    obj_fields = [
+        "object_id", "label", "bbox_x1", "bbox_y1", "bbox_x2", "bbox_y2",
+        "sam_confidence", "clip_confidence", "distance_cm",
+        "iou_score", "is_stable", "has_grasp", "grasp",
+        "obb_angle_deg", "obb_theta_rad",
+    ]
+    first = objs[0] if objs else {}  # empty objects list now yields FAILs instead of an IndexError
+    for field in obj_fields:
+        check(f"objects[0].{field} present", field in first)
+
+    # value spot-checks
+    check("sam.total_detections == 2",        sam.get("total_detections") == 2)
+    check("clip.filtered_regions == 2",       clip.get("filtered_regions") == 2)
+    check("object label 'cup' in object_id",  "cup" in first.get("object_id", "") or first.get("label") == "cup")
+    check("bbox values correct",              first.get("bbox_x1") == 100 and first.get("bbox_y2") == 400)
+    check("sam_confidence is float",          isinstance(first.get("sam_confidence"), float))
+    check("clip_confidence is float",         isinstance(first.get("clip_confidence"), float))
+    check("iou_score is float",               isinstance(first.get("iou_score"), float))
+    check("is_stable is bool",                isinstance(first.get("is_stable"), bool))
+
+
+# ── Test 3: /api/data schema (benchmark_dashboard SAM topic callback) ──────────
+
+def test_api_data_schema():  # NOTE: validates a hand-built replica; benchmark_dashboard is never called here
+    print("\n── Test 3: /api/data schema (sam_detections_callback output) ───")
+    # Rebuild, from FAKE_DETECTIONS, the record layout of benchmark_dashboard.sam_detections_callback
+    timestamp = datetime.now().isoformat()
+    sam_data_records = []
+    for det in FAKE_DETECTIONS:
+        bbox = det["bbox"]
+        center = det["center"]
+        record = {
+            "timestamp":        timestamp,
+            "frame_id":         "camera_link",
+            "obj_id":           det["id"],
+            "bbox":             {"x1": bbox[0], "y1": bbox[1], "x2": bbox[2], "y2": bbox[3]},
+            "center":           {"u": center[0], "v": center[1]},
+            "confidence":       float(det["confidence"]),
+            "area":             det["area"],
+            "distance_cm":      float(det["distance_cm"]),
+            "iou_score":        float(det["iou_score"]),
+            "is_stable":        bool(det["is_stable"]),
+            "ap_iou_threshold": 0.5 if det["is_stable"] else 0.0,
+        }
+        sam_data_records.append(record)
+
+    # Check each field that updateSAMDetections() accesses in the HTML
+    r = sam_data_records[0]  # only the first record is inspected
+    for field in ["obj_id", "bbox", "center", "confidence", "iou_score", "is_stable", "distance_cm", "timestamp"]:
+        check(f"sam record has '{field}'", field in r)
+
+    check("bbox has x1/y1/x2/y2",   all(k in r["bbox"] for k in ["x1","y1","x2","y2"]))
+    check("center has u/v",          all(k in r["center"] for k in ["u","v"]))
+    check("confidence is numeric",   isinstance(r["confidence"], float))
+    check("distance_cm is numeric",  isinstance(r["distance_cm"], float))
+
+    # Simulate full /api/data structure
+    api_data = {
+        "pixel_to_real":       [],
+        "sam_detections":      sam_data_records,
+        "clip_classifications":[],
+        "grasp_detections":    [],
+        "scene_understanding": [],
+        "metadata":            {"start_time": timestamp, "total_calls": len(sam_data_records)},
+    }
+    # Check updateDashboard() fields
+    for key in ["pixel_to_real", "sam_detections", "clip_classifications",
+                "grasp_detections", "scene_understanding", "metadata"]:
+        check(f"/api/data has '{key}'", key in api_data)
+    check("metadata.total_calls present", "total_calls" in api_data["metadata"])
+
+
+# ── Test 4: Incremental append (run_no increments) ───────────────────────────
+
+def test_incremental_append(tmp_file):
+    print("\n── Test 4: Incremental append (run numbers) ─────────────────────")
+    if tmp_file is None:
+        print("  Skipped")
+        return
+    simulate_save(FAKE_DETECTIONS, FAKE_CLIP, 0.9, tmp_file)
+    simulate_save(FAKE_DETECTIONS, FAKE_CLIP, 1.1, tmp_file)
+
+    with open(tmp_file) as f:
+        history = json.load(f)
+
+    check("3 runs in history",               len(history) == 3)
+    check("run_no increments: 1,2,3",        [r["meta"]["run_no"] for r in history] == [1, 2, 3])
+    check("latest run_no is 3",              history[-1]["meta"]["run_no"] == 3)
+    check("source == 'detect_objects'",      all(r["meta"].get("source") == "detect_objects" for r in history))
+
+
+# ── Test 5: Actual HISTORY_FILE path resolution ───────────────────────────────
+
+def test_path_resolution():
+    print("\n── Test 5: Path resolution ──────────────────────────────────────")
+    # This is how simple_sam_detector.py resolves the path:
+    # Path(__file__).parent.parent where __file__ is vision/simple_sam_detector.py
+    sam_file = PACKAGE_ROOT / "vision" / "simple_sam_detector.py"
+    resolved = sam_file.parent.parent / "vision_runs_history.json"
+
+    # And how benchmark_dashboard.py resolves it:
+    dash_file = PACKAGE_ROOT / "vision" / "benchmark_dashboard.py"
+    dash_resolved = dash_file.parent.parent / "vision_runs_history.json"
+
+    check("simple_sam_detector path resolves correctly",
+          str(resolved) == str(HISTORY_FILE),
+          f"got {resolved}")
+    check("benchmark_dashboard path resolves correctly",
+          str(dash_resolved) == str(HISTORY_FILE),
+          f"got {dash_resolved}")
+    check("Both paths are identical",
+          resolved == dash_resolved)
+    check("simple_sam_detector.py exists",
+          sam_file.exists(),
+          f"missing: {sam_file}")
+    check("benchmark_dashboard.py exists",
+          dash_file.exists(),
+          f"missing: {dash_file}")
+    print(f"  {INFO}  History file path: {HISTORY_FILE}")
+
+
+# ── Test 6: Dashboard HTML endpoints exist ────────────────────────────────────
+
+def test_html_endpoints():
+    print("\n── Test 6: Dashboard HTML references ────────────────────────────")
+    html_file = PACKAGE_ROOT / "dashboard" / "index.html"
+    check("index.html exists", html_file.exists())
+    if html_file.exists():
+        content = html_file.read_text()
+        check("fetches /api/data",        "/api/data"        in content)
+        check("fetches /api/run-history", "/api/run-history" in content)
+        check("polls every 2s",           "2000"             in content)
+        check("runHistoryBody table",     "runHistoryBody"   in content)
+        check("samBody table",            "samBody"          in content)
+        check("latestObjectsBody table",  "latestObjectsBody" in content)
+
+
+# ── Main ──────────────────────────────────────────────────────────────────────
+
+def main():
+    print("=" * 65)
+    print("  Vision Dashboard Data-Flow Unit Test")
+    print("=" * 65)
+
+    tmp_file, run, history = test_file_written()
+    test_run_history_schema(run)
+    test_api_data_schema()
+    test_incremental_append(tmp_file)
+    test_path_resolution()
+    test_html_endpoints()
+
+    # Clean up temp file
+    if tmp_file and tmp_file.exists():
+        tmp_file.unlink()
+
+    print("\n" + "=" * 65)
+    if failures:
+        print(f"\033[91m  {len(failures)} FAILED:\033[0m")
+        for f in failures:
+            print(f"    • {f}")
+        print("=" * 65)
+        sys.exit(1)
+    else:
+        print(f"\033[92m  All tests passed.\033[0m")
+        print("=" * 65)
+
+    # ── Show current history file state ───────────────────────────────────────
+    print(f"\n{INFO}  Checking actual history file: {HISTORY_FILE}")
+    if HISTORY_FILE.exists():
+        with open(HISTORY_FILE) as f:
+            data = json.load(f)
+        print(f"  {PASS}  File exists — {len(data)} run(s) stored")
+        if data:
+            latest = data[-1]
+            print(f"  {INFO}  Latest run: #{latest['meta']['run_no']}  "
+                  f"ts={latest['meta']['timestamp']}  "
+                  f"objects={latest['sam']['total_detections']}")
+    else:
+        print(f"  \033[93m[WARN]\033[0m  {HISTORY_FILE} does not exist yet.")
+        print(f"         The file is created when you call:")
+        print(f"           ros2 service call /vision/detect_objects custom_interfaces/srv/DetectObjects")
+        print(f"         Make sure simple_sam_detector is running and a camera frame is available.")
+
+
+if __name__ == "__main__":  # run the checks only when executed as a script
+    main()

From b328bbb0589f3db8482db30c36e4c5461653c007 Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Sat, 11 Apr 2026 04:51:13 +0700
Subject: [PATCH 13/16] feat: benchmark sam and clip and find object service

---
 dashboard/find_object.html         | 817 +++++++++++++++++++++++++++++
 dashboard/index.html               |  30 +-
 vision/benchmark_dashboard.py      | 346 +++++++++++-
 vision/clip_classifier.py          | 375 ++++++-------
 vision/find_object_service_node.py |  45 +-
 vision/obb_angle_service_node.py   | 256 ++++-----
 vision/simple_sam_detector.py      | 614 +++++++++++++++-------
 7 files changed, 1926 insertions(+), 557 deletions(-)
 create mode 100644 dashboard/find_object.html

diff --git a/dashboard/find_object.html b/dashboard/find_object.html
new file mode 100644
index 0000000..907379a
--- /dev/null
+++ b/dashboard/find_object.html
@@ -0,0 +1,817 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <title>Find Object — Vision Benchmark</title>
+    <style>
+        :root {
+            --bg:            #f1f5f9;
+            --surface:       #ffffff;
+            --border:        #e2e8f0;
+            --text-primary:  #0f172a;
+            --text-secondary:#64748b;
+            --text-muted:    #94a3b8;
+            --ok:   #22c55e;
+            --warn: #f59e0b;
+            --fail: #ef4444;
+            --nav-bg:   #0f172a;
+            --nav-text: #94a3b8;
+            --accent:   #6366f1;
+            --radius:    10px;
+            --radius-sm: 6px;
+            --shadow:    0 1px 3px rgba(0,0,0,.08), 0 1px 2px rgba(0,0,0,.05);
+            --shadow-md: 0 4px 6px rgba(0,0,0,.07), 0 2px 4px rgba(0,0,0,.05);
+        }
+        *, *::before, *::after { box-sizing: border-box; margin: 0; padding: 0; }
+        body {
+            font-family: -apple-system, BlinkMacSystemFont, 'Segoe UI', sans-serif;
+            background: var(--bg);
+            color: var(--text-primary);
+            font-size: 14px;
+            line-height: 1.5;
+            display: flex;
+            min-height: 100vh;
+        }
+
+        /* ── Sidebar ── */
+        #sidebar {
+            width: 226px; min-width: 226px;
+            background: var(--nav-bg);
+            position: fixed; top: 0; left: 0;
+            height: 100vh; z-index: 100;
+            display: flex; flex-direction: column;
+            overflow-y: auto;
+        }
+        .sb-brand { padding: 22px 18px 16px; border-bottom: 1px solid rgba(255,255,255,.07); }
+        .sb-brand-title { font-size: 13px; font-weight: 700; color: #fff; line-height: 1.35; }
+        .sb-brand-sub   { font-size: 11px; color: var(--nav-text); margin-top: 4px; }
+        .sb-live {
+            display: flex; align-items: center; gap: 8px;
+            padding: 9px 18px; border-bottom: 1px solid rgba(255,255,255,.07);
+            font-size: 11px; color: var(--nav-text);
+        }
+        .live-dot {
+            width: 7px; height: 7px; border-radius: 50%;
+            background: var(--ok); animation: pulse 2s infinite; flex-shrink: 0;
+        }
+        @keyframes pulse { 0%,100%{opacity:1;transform:scale(1)} 50%{opacity:.45;transform:scale(.8)} }
+        .sb-group {
+            font-size: 10px; font-weight: 700; text-transform: uppercase;
+            letter-spacing: 1.1px; color: rgba(255,255,255,.22); padding: 16px 18px 6px;
+        }
+        .sb-link {
+            display: flex; align-items: center; gap: 10px;
+            padding: 8px 18px; color: var(--nav-text); font-size: 12.5px;
+            font-weight: 500; cursor: pointer; border-left: 3px solid transparent;
+            transition: background .12s, color .12s; user-select: none;
+        }
+        .sb-link:hover { background: rgba(255,255,255,.06); color: #fff; }
+        .sb-link.active { border-left-color: var(--accent); color: #fff; background: rgba(255,255,255,.05); }
+        .sb-dot { width: 8px; height: 8px; border-radius: 50%; flex-shrink: 0; }
+        .sb-count {
+            margin-left: auto; font-size: 11px; font-weight: 600;
+            background: rgba(255,255,255,.09); padding: 1px 7px;
+            border-radius: 10px; color: rgba(255,255,255,.45);
+            min-width: 24px; text-align: center;
+        }
+
+        /* ── Main ── */
+        #main { margin-left: 226px; flex: 1; min-width: 0; display: flex; flex-direction: column; }
+        #topbar {
+            background: var(--surface); border-bottom: 1px solid var(--border);
+            padding: 13px 28px; display: flex; align-items: center; gap: 16px;
+            position: sticky; top: 0; z-index: 90; box-shadow: var(--shadow);
+        }
+        .topbar-title { font-size: 15px; font-weight: 700; }
+        .topbar-sub   { font-size: 11.5px; color: var(--text-secondary); margin-top: 1px; }
+        .topbar-right { margin-left: auto; display: flex; align-items: center; gap: 10px; }
+        .page-body { padding: 24px 28px; flex: 1; }
+
+        /* ── Buttons ── */
+        .btn {
+            padding: 8px 18px; border-radius: var(--radius-sm); font-size: 13px;
+            font-weight: 600; cursor: pointer; border: 1px solid var(--border);
+            background: transparent; color: var(--text-secondary); transition: all .13s;
+        }
+        .btn:hover { background: var(--bg); color: var(--text-primary); }
+        .btn-primary {
+            background: var(--accent); color: #fff; border-color: var(--accent);
+        }
+        .btn-primary:hover { background: #4f46e5; border-color: #4f46e5; }
+        .btn-ok   { background: #dcfce7; color: #15803d; border-color: #bbf7d0; }
+        .btn-ok:hover { background: #bbf7d0; }
+        .btn-fail { background: #fee2e2; color: #dc2626; border-color: #fecaca; }
+        .btn-fail:hover { background: #fecaca; }
+        .btn-sm { padding: 4px 12px; font-size: 12px; }
+
+        /* ── Card ── */
+        .card {
+            background: var(--surface); border: 1px solid var(--border);
+            border-radius: var(--radius); box-shadow: var(--shadow); margin-bottom: 22px;
+            overflow: hidden;
+        }
+        .card-head {
+            padding: 15px 20px; border-bottom: 1px solid var(--border);
+            display: flex; align-items: center; gap: 12px; background: #fafbfc;
+        }
+        .card-accent { width: 4px; height: 38px; border-radius: 3px; flex-shrink: 0; }
+        .card-title    { font-size: 14px; font-weight: 700; }
+        .card-subtitle { font-size: 11px; color: var(--text-secondary); margin-top: 2px; font-family: monospace; }
+        .card-badge {
+            margin-left: auto; font-size: 11px; font-weight: 700;
+            padding: 4px 12px; border-radius: 14px; color: #fff; white-space: nowrap;
+        }
+        .card-body { padding: 20px; }
+
+        /* ── Trigger panel ── */
+        .trigger-grid {
+            display: grid; grid-template-columns: 1fr auto; gap: 10px; align-items: end;
+            margin-bottom: 16px;
+        }
+        .field-group { display: flex; flex-direction: column; gap: 4px; }
+        .field-label { font-size: 11px; font-weight: 600; text-transform: uppercase; letter-spacing: .6px; color: var(--text-secondary); }
+        .field-input {
+            padding: 9px 14px; border: 1px solid var(--border); border-radius: var(--radius-sm);
+            font-size: 13px; outline: none; transition: border-color .15s;
+            background: var(--bg); color: var(--text-primary);
+        }
+        .field-input:focus { border-color: var(--accent); background: #fff; }
+
+        .status-bar {
+            padding: 10px 14px; border-radius: var(--radius-sm);
+            font-size: 12.5px; font-weight: 500; margin-bottom: 16px;
+            display: flex; align-items: center; gap: 8px;
+        }
+        .status-idle    { background: #f1f5f9; color: var(--text-secondary); }
+        .status-running { background: #eff6ff; color: #1d4ed8; border: 1px solid #bfdbfe; }
+        .status-ok      { background: #dcfce7; color: #15803d; border: 1px solid #bbf7d0; }
+        .status-fail    { background: #fee2e2; color: #dc2626; border: 1px solid #fecaca; }
+
+        /* ── Result panel ── */
+        .result-grid {
+            display: grid; grid-template-columns: 1fr 1fr; gap: 16px; margin-bottom: 16px;
+        }
+        @media (max-width: 700px) { .result-grid { grid-template-columns: 1fr; } }
+        .result-section { }
+        .result-label { font-size: 10.5px; font-weight: 700; text-transform: uppercase; letter-spacing: .7px; color: var(--text-muted); margin-bottom: 8px; }
+        .kv-list { display: flex; flex-direction: column; gap: 5px; }
+        .kv-row  { display: flex; align-items: baseline; gap: 8px; }
+        .kv-key  { font-size: 11.5px; color: var(--text-secondary); min-width: 90px; flex-shrink: 0; }
+        .kv-val  { font-size: 13px; font-weight: 600; color: var(--text-primary); font-family: monospace; }
+
+        /* ── HITL panel ── */
+        .hitl-panel {
+            border: 2px solid #f59e0b; border-radius: var(--radius);
+            background: #fffbeb; padding: 18px 20px;
+            margin-bottom: 16px;
+        }
+        .hitl-title {
+            font-size: 14px; font-weight: 700; color: #92400e; margin-bottom: 6px;
+            display: flex; align-items: center; gap: 8px;
+        }
+        .hitl-subtitle { font-size: 12px; color: #78350f; margin-bottom: 14px; }
+        .hitl-buttons  { display: flex; gap: 10px; flex-wrap: wrap; }
+        .hitl-note     { font-size: 11.5px; color: var(--text-secondary); margin-top: 10px; }
+
+        .verdict-ok   { background: #dcfce7; color: #15803d; border: 1px solid #bbf7d0; border-radius: 8px; padding: 8px 16px; font-weight: 700; font-size: 13px; display: inline-flex; align-items: center; gap: 6px; }
+        .verdict-fail { background: #fee2e2; color: #dc2626; border: 1px solid #fecaca; border-radius: 8px; padding: 8px 16px; font-weight: 700; font-size: 13px; display: inline-flex; align-items: center; gap: 6px; }
+        .verdict-pending { background: #fffbeb; color: #92400e; border: 1px solid #fde68a; border-radius: 8px; padding: 8px 16px; font-weight: 700; font-size: 13px; display: inline-flex; align-items: center; gap: 6px; }
+
+        /* ── KPI row ── */
+        .kpi-row { display: flex; gap: 14px; margin-bottom: 22px; flex-wrap: wrap; }
+        .kpi-tile {
+            background: var(--surface); border: 1px solid var(--border);
+            border-radius: var(--radius); padding: 14px 18px; box-shadow: var(--shadow);
+            flex: 1; min-width: 130px; position: relative; overflow: hidden;
+        }
+        .kpi-tile::before { content:''; position: absolute; top:0;left:0;right:0;height:3px;background:var(--t-accent,#6366f1); }
+        .kpi-val { font-size: 28px; font-weight: 700; line-height: 1; margin-bottom: 5px; font-variant-numeric: tabular-nums; }
+        .kpi-lbl { font-size: 11px; font-weight: 600; text-transform: uppercase; letter-spacing: .6px; color: var(--text-secondary); }
+
+        /* ── History table ── */
+        .table-wrap { overflow-x: auto; max-height: 480px; overflow-y: auto; }
+        .table-wrap::-webkit-scrollbar { width: 5px; height: 5px; }
+        .table-wrap::-webkit-scrollbar-thumb { background: #cbd5e1; border-radius: 3px; }
+        table { width: 100%; border-collapse: collapse; font-size: 13px; }
+        thead tr { position: sticky; top: 0; z-index: 10; }
+        th {
+            background: #f8fafc; color: var(--text-secondary); font-size: 10.5px;
+            font-weight: 700; text-transform: uppercase; letter-spacing: .7px;
+            padding: 10px 14px; text-align: left; border-bottom: 2px solid var(--border);
+            white-space: nowrap;
+        }
+        td { padding: 10px 14px; border-bottom: 1px solid #f1f5f9; vertical-align: middle; }
+        tbody tr:hover td { background: #f8fafc; }
+        tbody tr:last-child td { border-bottom: none; }
+        .no-data-row td { text-align: center; padding: 38px 20px; color: var(--text-muted); font-style: italic; }
+
+        /* ── Chips ── */
+        .chip { display: inline-flex; align-items: center; gap: 3px; padding: 2px 8px; border-radius: 10px; font-size: 11px; font-weight: 600; white-space: nowrap; }
+        .chip-ok    { background: #dcfce7; color: #15803d; }
+        .chip-fail  { background: #fee2e2; color: #dc2626; }
+        .chip-warn  { background: #fffbeb; color: #92400e; }
+        .chip-muted { background: #f1f5f9; color: #64748b; }
+        .chip-label { background: #ede9fe; color: #6d28d9; }
+        .mono { font-family: monospace; font-size: 11.5px; color: var(--text-secondary); }
+        .ts   { font-size: 11px; color: var(--text-muted); white-space: nowrap; }
+
+        /* ── Conf bar ── */
+        .conf-bar { display: flex; align-items: center; gap: 7px; }
+        .conf-track { width: 56px; height: 5px; background: #e2e8f0; border-radius: 3px; overflow: hidden; flex-shrink: 0; }
+        .conf-fill { height: 100%; border-radius: 3px; }
+        .conf-fill.high { background: var(--ok); }
+        .conf-fill.med  { background: var(--warn); }
+        .conf-fill.low  { background: var(--fail); }
+        .conf-num { font-size: 12px; font-weight: 600; min-width: 34px; font-variant-numeric: tabular-nums; }
+        .conf-num.high { color: #15803d; }
+        .conf-num.med  { color: #92400e; }
+        .conf-num.low  { color: #b91c1c; }
+
+        .footer {
+            border-top: 1px solid var(--border); padding: 11px 28px;
+            display: flex; align-items: center; justify-content: space-between;
+            font-size: 11px; color: var(--text-muted); background: var(--surface);
+        }
+
+        /* ── Spinner ── */
+        .spinner {
+            width: 16px; height: 16px; border: 2px solid #bfdbfe;
+            border-top-color: #1d4ed8; border-radius: 50%;
+            animation: spin .7s linear infinite; flex-shrink: 0;
+        }
+        @keyframes spin { to { transform: rotate(360deg); } }
+
+        /* ── Accuracy badge in history table ── */
+        tr.verdict-row-ok   td:first-child { border-left: 3px solid var(--ok); }
+        tr.verdict-row-fail td:first-child { border-left: 3px solid var(--fail); }
+        tr.verdict-row-none td:first-child { border-left: 3px solid transparent; }
+    </style>
+</head>
+<body>
+
+<!-- ══ SIDEBAR ══ (section links scroll inline: a bare scrollTo() in an on* attribute resolves to Element.scrollTo) -->
+<nav id="sidebar">
+    <div class="sb-brand">
+        <div class="sb-brand-title">Vision Pipeline<br>Research Dashboard</div>
+        <div class="sb-brand-sub">ROS 2 · Real-time Monitor</div>
+    </div>
+    <div class="sb-live"><div class="live-dot"></div>Live · auto-refresh</div>
+
+    <div class="sb-group">Navigation</div>
+    <div class="sb-link" onclick="window.location.href='index.html'">
+        <div class="sb-dot" style="background:#64748b"></div>
+        Main Dashboard
+    </div>
+    <div class="sb-link active">
+        <div class="sb-dot" style="background:var(--accent)"></div>
+        Find Object
+        <span class="sb-count" id="nav-total">0</span>
+    </div>
+
+    <div class="sb-group">Stats</div>
+    <div class="sb-link" onclick="document.getElementById('sec-trigger').scrollIntoView({behavior:'smooth',block:'start'})">
+        <div class="sb-dot" style="background:#10b981"></div>
+        Trigger Service
+    </div>
+    <div class="sb-link" onclick="document.getElementById('sec-hitl').scrollIntoView({behavior:'smooth',block:'start'})">
+        <div class="sb-dot" style="background:#f59e0b"></div>
+        Human-in-the-Loop
+        <span class="sb-count" id="nav-pending">0</span>
+    </div>
+    <div class="sb-link" onclick="document.getElementById('sec-history').scrollIntoView({behavior:'smooth',block:'start'})">
+        <div class="sb-dot" style="background:var(--accent)"></div>
+        Call History
+        <span class="sb-count" id="nav-history">0</span>
+    </div>
+    <div class="sb-link" onclick="document.getElementById('sec-accuracy').scrollIntoView({behavior:'smooth',block:'start'})">
+        <div class="sb-dot" style="background:#ec4899"></div>
+        Accuracy Report
+    </div>
+</nav>
+
+<!-- ══ MAIN ══ -->
+<div id="main">
+
+    <div id="topbar">
+        <div>
+            <div class="topbar-title">Find Object — Service Benchmark</div>
+            <div class="topbar-sub">/find_object · SAM + CLIP + OBB + Pixel-to-Real · Human-in-the-Loop accuracy</div>
+        </div>
+        <div class="topbar-right">
+            <div class="sb-live" style="border:1px solid var(--border);border-radius:20px;padding:5px 13px;background:var(--bg);">
+                <div class="live-dot"></div>
+                <span style="font-size:12px;color:var(--text-secondary)">Auto-refresh 3 s</span>
+            </div>
+            <button class="btn" onclick="clearHistory()">Clear History</button>
+        </div>
+    </div>
+
+    <div class="page-body">
+
+        <!-- ── KPI row ── -->
+        <div class="kpi-row">
+            <div class="kpi-tile" style="--t-accent:#6366f1">
+                <div class="kpi-val" id="kpiTotal">0</div>
+                <div class="kpi-lbl">Total Calls</div>
+            </div>
+            <div class="kpi-tile" style="--t-accent:#22c55e">
+                <div class="kpi-val" id="kpiSuccess">0</div>
+                <div class="kpi-lbl">Succeeded</div>
+            </div>
+            <div class="kpi-tile" style="--t-accent:#ef4444">
+                <div class="kpi-val" id="kpiFailed">0</div>
+                <div class="kpi-lbl">Failed</div>
+            </div>
+            <div class="kpi-tile" style="--t-accent:#ec4899">
+                <div class="kpi-val" id="kpiAccuracy">—</div>
+                <div class="kpi-lbl">HITL Accuracy</div>
+            </div>
+            <div class="kpi-tile" style="--t-accent:#f59e0b">
+                <div class="kpi-val" id="kpiPending">0</div>
+                <div class="kpi-lbl">Pending Review</div>
+            </div>
+            <div class="kpi-tile" style="--t-accent:#06b6d4">
+                <div class="kpi-val" id="kpiAvgConf">—</div>
+                <div class="kpi-lbl">Avg Confidence</div>
+            </div>
+        </div>
+
+        <!-- ── Trigger panel ── -->
+        <div id="sec-trigger" class="card">
+            <div class="card-head">
+                <div class="card-accent" style="background:#10b981"></div>
+                <div>
+                    <div class="card-title">Trigger /find_object Service</div>
+                    <div class="card-subtitle">ros2 service call /find_object custom_interfaces/srv/FindObjectReal "{label: '...'}"</div>
+                </div>
+            </div>
+            <div class="card-body">
+                <div class="trigger-grid">
+                    <div class="field-group">
+                        <div class="field-label">Object Label</div>
+                        <input id="labelInput" class="field-input" type="text" placeholder="e.g.  bowl, cup, bottle, box" value="bowl"
+                               onkeydown="if(event.key==='Enter') triggerService()">
+                    </div>
+                    <button class="btn btn-primary" onclick="triggerService()" id="triggerBtn">
+                        ▶ Call Service
+                    </button>
+                </div>
+                <div id="statusBar" class="status-bar status-idle">Ready — enter a label and press Call Service.</div>
+
+                <!-- Live result ── shown after a successful call -->
+                <div id="resultBlock" style="display:none">
+                    <div class="result-grid">
+                        <div class="result-section">
+                            <div class="result-label">Detection</div>
+                            <div class="kv-list">
+                                <div class="kv-row"><span class="kv-key">Label searched</span><span class="kv-val" id="resLabel">—</span></div>
+                                <div class="kv-row"><span class="kv-key">Object ID</span><span class="kv-val" id="resObjId">—</span></div>
+                                <div class="kv-row"><span class="kv-key">Confidence</span><span class="kv-val" id="resConf">—</span></div>
+                                <div class="kv-row"><span class="kv-key">Bounding Box</span><span class="kv-val" id="resBBox">—</span></div>
+                                <div class="kv-row"><span class="kv-key">Status</span><span class="kv-val" id="resStatus">—</span></div>
+                            </div>
+                        </div>
+                        <div class="result-section">
+                            <div class="result-label">World Coordinates + Angle</div>
+                            <div class="kv-list">
+                                <div class="kv-row"><span class="kv-key">X (m)</span><span class="kv-val" id="resX">—</span></div>
+                                <div class="kv-row"><span class="kv-key">Y (m)</span><span class="kv-val" id="resY">—</span></div>
+                                <div class="kv-row"><span class="kv-key">Z (m)</span><span class="kv-val" id="resZ">—</span></div>
+                                <div class="kv-row"><span class="kv-key">θ (rad)</span><span class="kv-val" id="resTheta">—</span></div>
+                                <div class="kv-row"><span class="kv-key">θ (deg)</span><span class="kv-val" id="resThetaDeg">—</span></div>
+                            </div>
+                        </div>
+                    </div>
+                    <div class="result-section" style="margin-bottom:12px">
+                        <div class="result-label">Message from service</div>
+                        <div id="resMessage" style="font-size:12.5px;color:var(--text-secondary);background:var(--bg);padding:10px 14px;border-radius:var(--radius-sm);font-family:monospace;word-break:break-all"></div>
+                    </div>
+                </div>
+            </div>
+        </div>
+
+        <!-- ── Human-in-the-Loop panel ── -->
+        <div id="sec-hitl" class="card">
+            <div class="card-head">
+                <div class="card-accent" style="background:#f59e0b"></div>
+                <div>
+                    <div class="card-title">Human-in-the-Loop Verification</div>
+                    <div class="card-subtitle">Review latest detection result — mark as correct or incorrect</div>
+                </div>
+                <span class="card-badge" id="hitlBadge" style="background:#f59e0b">Waiting for call…</span>
+            </div>
+            <div class="card-body">
+                <div id="hitlEmpty" style="color:var(--text-muted);font-style:italic;font-size:13px">
+                    No result to review yet. Trigger the service above first.
+                </div>
+                <div id="hitlContent" style="display:none">
+                    <div class="hitl-panel">
+                        <div class="hitl-title">
+                            <span>&#128270;</span>
+                            Was the detected object correct?
+                        </div>
+                        <div class="hitl-subtitle" id="hitlQuestion">
+                            Service returned: <strong id="hitlObjLabel">—</strong> (ID: <span id="hitlObjId">—</span>)
+                            at world position (<span id="hitlXYZ">—</span>), θ = <span id="hitlTheta">—</span> rad
+                        </div>
+                        <div id="hitlVerdictDisplay"></div>
+                        <div class="hitl-buttons" id="hitlButtons">
+                            <button class="btn btn-ok" onclick="submitVerdict(true)">&#10003; Correct — Object matches label</button>
+                            <button class="btn btn-fail" onclick="submitVerdict(false)">&#10007; Incorrect — Wrong / missing object</button>
+                        </div>
+                        <div class="hitl-note" id="hitlNote">Your verdict will be recorded against this call in the history table.</div>
+                    </div>
+                </div>
+            </div>
+        </div>
+
+        <!-- ── Call History ── -->
+        <div id="sec-history" class="card">
+            <div class="card-head">
+                <div class="card-accent" style="background:var(--accent)"></div>
+                <div>
+                    <div class="card-title">Call History</div>
+                    <div class="card-subtitle">find_object_history.json · newest first · max 50 calls</div>
+                </div>
+                <span class="card-badge" id="historyBadge" style="background:var(--accent)">0 Calls</span>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>#</th>
+                        <th>Timestamp</th>
+                        <th>Label</th>
+                        <th>Object ID</th>
+                        <th>Confidence</th>
+                        <th>Bounding Box</th>
+                        <th>X (m)</th>
+                        <th>Y (m)</th>
+                        <th>Z (m)</th>
+                        <th>θ (deg)</th>
+                        <th>Service OK</th>
+                        <th>HITL Verdict</th>
+                        <th>Verify</th>
+                        <th>Message</th>
+                    </tr></thead>
+                    <tbody id="historyBody">
+                        <tr class="no-data-row"><td colspan="14">No calls yet — trigger the service above.</td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
+        <!-- ── Accuracy Report ── -->
+        <div id="sec-accuracy" class="card">
+            <div class="card-head">
+                <div class="card-accent" style="background:#ec4899"></div>
+                <div>
+                    <div class="card-title">Accuracy Report</div>
+                    <div class="card-subtitle">Per-label breakdown from human-in-the-loop verdicts</div>
+                </div>
+            </div>
+            <div class="table-wrap">
+                <table>
+                    <thead><tr>
+                        <th>Label</th>
+                        <th>Total Calls</th>
+                        <th>Succeeded</th>
+                        <th>Failed</th>
+                        <th>Reviewed</th>
+                        <th>Correct</th>
+                        <th>Incorrect</th>
+                        <th>HITL Accuracy</th>
+                        <th>Avg Confidence</th>
+                    </tr></thead>
+                    <tbody id="accuracyBody">
+                        <tr class="no-data-row"><td colspan="9">No data yet.</td></tr>
+                    </tbody>
+                </table>
+            </div>
+        </div>
+
+    </div><!-- /page-body -->
+
+    <div class="footer">
+        <span>Find Object Benchmark · Vision Pipeline · ROS 2</span>
+        <span>Last updated: <span id="lastUpdated">—</span></span>
+    </div>
+</div><!-- /main -->
+
+<script>
+// ── State ──────────────────────────────────────────────────────────────────
+let history    = [];          // all calls loaded from server (replaced wholesale by loadHistory)
+let pendingIdx = null;        // index into history[] awaiting HITL verdict; null when nothing is selected
+
+// ── Utilities ──────────────────────────────────────────────────────────────
+function confClass(v) { if (v >= 0.7) return 'high'; if (v >= 0.4) return 'med'; return 'low'; }  // CSS tier for a score
+function confBar(v) {  // bar + 3-decimal number for a score; dash when missing or non-numeric; width clamped to 0-100%
+    const num = Number(v), cls = confClass(num), pct = Math.max(0, Math.min(100, Math.round(num * 100)));
+    if (v == null || v === '' || !Number.isFinite(num)) return '<span style="color:var(--text-muted)">—</span>';
+    return `<div class="conf-bar">
+        <div class="conf-track"><div class="conf-fill ${cls}" style="width:${pct}%"></div></div>
+        <span class="conf-num ${cls}">${num.toFixed(3)}</span>
+    </div>`;
+}
+function tsShort(t) {  // timestamp cell: locale date/time, or a dash when `t` is falsy
+    const text = t ? new Date(t).toLocaleString() : '—';
+    return `<span class="ts">${text}</span>`;
+}
+function scrollTo(id) {  // smooth-scroll the element with this id into view; unknown ids are ignored
+    const target = document.getElementById(id);
+    target && target.scrollIntoView({ behavior: 'smooth', block: 'start' });
+}
+function setStatus(type, msg) {
+    // `msg` is assigned to innerHTML as-is, so callers must pass trusted or escaped HTML.
+    const bar     = document.getElementById('statusBar');
+    const running = type === 'running';
+    bar.className = 'status-bar status-' + type;
+    bar.innerHTML = running ? `<div class="spinner"></div> ${msg}` : msg;
+}
+
+// ── Trigger service ────────────────────────────────────────────────────────
+async function triggerService() {
+    // POST the typed label to /api/find-object, show the outcome, then reload the history
+    // and point the HITL panel at its last entry. The button is disabled while the call runs.
+    // Label and server text are escaped because setStatus() assigns its message to innerHTML.
+    const esc = s => String(s == null ? '' : s).replace(/[&<>"']/g, c => `&#${c.charCodeAt(0)};`);
+    const label = document.getElementById('labelInput').value.trim();
+    if (!label) { setStatus('fail', '&#9888; Please enter an object label.'); return; }
+
+    document.getElementById('triggerBtn').disabled = true;
+    document.getElementById('resultBlock').style.display = 'none';
+    setStatus('running', `Calling /find_object with label "<strong>${esc(label)}</strong>"…`);
+
+    try {
+        const res  = await fetch('/api/find-object', {
+            method:  'POST',
+            headers: { 'Content-Type': 'application/json' },
+            body:    JSON.stringify({ label })
+        });
+        const data = await res.json();
+
+        if (data.error) {
+            setStatus('fail', '&#10007; ' + esc(data.error));
+        } else if (data.success) {
+            setStatus('ok', `&#10003; Found "<strong>${esc(label)}</strong>" — confidence ${Number(data.confidence).toFixed(3)}`);
+        } else {
+            setStatus('fail', `&#10007; Service returned failure — ${esc(data.message)}`);
+        }
+
+        showResult(data, label);   // populate the live result block
+        await loadHistory();       // the server is expected to have appended this call
+
+        // Point HITL to the newest entry
+        if (history.length) {
+            pendingIdx = history.length - 1;
+            showHITL(history[pendingIdx]);
+        }
+    } catch (e) {
+        setStatus('fail', '&#10007; Network/server error: ' + esc(e.message));
+    } finally {
+        document.getElementById('triggerBtn').disabled = false;
+    }
+}
+
+function showResult(data, label) {
+    // Reveal the live result block and fill it from one /api/find-object response.
+    const setText = (id, text) => { document.getElementById(id).textContent = text; };
+    const fixed4  = v => (v != null ? Number(v).toFixed(4) : '—');
+    document.getElementById('resultBlock').style.display = 'block';
+    setText('resLabel', label);
+    setText('resObjId', data.object_id || '—');
+    document.getElementById('resConf').innerHTML = confBar(data.confidence);
+    const box = data.bbox || [];
+    setText('resBBox', box.length >= 4 ? `[${box[0]}, ${box[1]}, ${box[2]}, ${box[3]}]` : '—');
+    document.getElementById('resStatus').innerHTML = data.success
+        ? '<span class="chip chip-ok">&#10003; Success</span>'
+        : '<span class="chip chip-fail">&#10007; Failed</span>';
+    setText('resX', fixed4(data.x));
+    setText('resY', fixed4(data.y));
+    setText('resZ', fixed4(data.z));
+    setText('resTheta', fixed4(data.theta));
+    setText('resThetaDeg', data.theta != null ? (Number(data.theta) * 180 / Math.PI).toFixed(2) + '°' : '—');
+    setText('resMessage', data.message || '');
+}
+
+// ── Human-in-the-Loop ─────────────────────────────────────────────────────
+function showHITL(entry) {
+    // Show one call in the Human-in-the-Loop panel. The verdict banner, the buttons, the
+    // note and the badge depend on entry.verdict: true, false, or anything else (pending).
+    const byId = id => document.getElementById(id);
+    const num  = (v, digits) => Number(v || 0).toFixed(digits);
+
+    byId('hitlEmpty').style.display   = 'none';
+    byId('hitlContent').style.display = 'block';
+
+    byId('hitlObjLabel').textContent = entry.label_searched || '—';
+    byId('hitlObjId').textContent    = entry.object_id || '—';
+    byId('hitlXYZ').textContent      = `${num(entry.x, 3)}, ${num(entry.y, 3)}, ${num(entry.z, 3)}`;
+    byId('hitlTheta').textContent    = num(entry.theta, 4);
+
+    // Each state: [banner HTML, display of the button row, note text, badge text].
+    let state;
+    if (entry.verdict === true) {
+        state = ['<div class="verdict-ok">&#10003; Marked CORRECT</div>',
+                 'none', 'Verdict already recorded.', 'Verified ✓'];
+    } else if (entry.verdict === false) {
+        state = ['<div class="verdict-fail">&#10007; Marked INCORRECT</div>',
+                 'none', 'Verdict already recorded.', 'Verified ✗'];
+    } else {
+        state = ['<div class="verdict-pending">&#9203; Awaiting review</div>',
+                 'flex', 'Your verdict will be recorded against this call.', 'Needs Review'];
+    }
+    const [bannerHtml, buttonDisplay, noteText, badgeText] = state;
+    byId('hitlVerdictDisplay').innerHTML = bannerHtml;
+    byId('hitlButtons').style.display    = buttonDisplay;
+    byId('hitlNote').textContent         = noteText;
+    byId('hitlBadge').textContent        = badgeText;
+}
+
+async function submitVerdict(correct) {
+    // Save the verdict for the call shown in the HITL panel; failures surface through alert().
+    if (pendingIdx === null || pendingIdx >= history.length) return;
+    const entry = history[pendingIdx];
+    try {
+        const request = {
+            method:  'POST',
+            headers: { 'Content-Type': 'application/json' },
+            body:    JSON.stringify({ call_id: entry.call_id, verdict: correct })
+        };
+        const data = await (await fetch('/api/find-object-verdict', request)).json();
+        if (!data.ok) {
+            alert('Failed to save verdict: ' + (data.error || 'unknown error'));
+            return;
+        }
+        entry.verdict = correct;   // reflect the verdict locally before the reload
+        showHITL(entry);
+        await loadHistory();
+    } catch (e) {
+        alert('Network error: ' + e.message);
+    }
+}
+
+// ── Load history from server ───────────────────────────────────────────────
+async function loadHistory() {
+    // Fetch the call list and re-render; a non-array payload counts as empty, errors only warn.
+    try {
+        const payload = await (await fetch('/api/find-object-history')).json();
+        history = Array.isArray(payload) ? payload : [];
+        renderAll();
+    } catch (err) {
+        console.warn('History unavailable:', err);
+    }
+}
+
+// ── Render ─────────────────────────────────────────────────────────────────
+function renderAll() {
+    // Refresh every history-derived view, then stamp the footer with the current time.
+    for (const render of [renderKPIs, renderHistoryTable, renderAccuracyReport]) render();
+    const stamp = new Date().toLocaleTimeString();
+    document.getElementById('lastUpdated').textContent = stamp;
+}
+
+function renderKPIs() {
+    // Recompute the KPI cards and sidebar counters from `history`.
+    const isPending = h => h.verdict === null || h.verdict === undefined;
+    const total    = history.length;
+    const success  = history.filter(h => h.success).length;
+    const pending  = history.filter(isPending).length;
+    const reviewed = total - pending;
+    const correct  = history.filter(h => h.verdict === true).length;
+    const accuracy = reviewed ? (correct / reviewed * 100).toFixed(1) + '%' : '—';
+    // confBar() treats null/'' as "no confidence"; do the same here and coerce to numbers,
+    // otherwise a '' or string value turns the sum into string concatenation / NaN.
+    const confs    = history.map(h => h.confidence).filter(c => c != null && c !== '')
+                            .map(Number).filter(Number.isFinite);
+    const avgConf  = confs.length ? (confs.reduce((s, v) => s + v, 0) / confs.length).toFixed(3) : '—';
+
+    const values = {
+        kpiTotal: total, kpiSuccess: success, kpiFailed: total - success, kpiAccuracy: accuracy,
+        kpiPending: pending, kpiAvgConf: avgConf, 'nav-total': total, 'nav-pending': pending,
+        'nav-history': total, historyBadge: `${total} Calls`,
+    };
+    for (const [id, value] of Object.entries(values)) document.getElementById(id).textContent = value;
+}
+
+function renderHistoryTable() {
+    // Rebuild the call-history table, newest first. Server-provided strings are HTML-escaped
+    // because the rows are assigned through innerHTML.
+    const esc = s => String(s == null ? '' : s).replace(/[&<>"']/g, c => `&#${c.charCodeAt(0)};`);
+    const tbody = document.getElementById('historyBody');
+    if (!history.length) {
+        tbody.innerHTML = '<tr class="no-data-row"><td colspan="14">No calls yet — trigger the service above.</td></tr>';
+        return;
+    }
+    const rows = history.slice().reverse().map((entry, revIdx) => {
+        const origIdx = history.length - 1 - revIdx;   // index into history[], passed to quickVerdict()
+        const bb      = entry.bbox || [];
+        const bboxStr = bb.length >= 4 ? `[${bb[0]},${bb[1]},${bb[2]},${bb[3]}]` : '—';
+        const thetaDeg = entry.theta != null ? (Number(entry.theta)*180/Math.PI).toFixed(1)+'°' : '—';
+        let verdictChip = '<span class="chip chip-warn">&#9203; Pending</span>';
+        let rowClass    = 'verdict-row-none';
+        if (entry.verdict === true)  { verdictChip = '<span class="chip chip-ok">&#10003; Correct</span>';   rowClass = 'verdict-row-ok'; }
+        if (entry.verdict === false) { verdictChip = '<span class="chip chip-fail">&#10007; Incorrect</span>'; rowClass = 'verdict-row-fail'; }
+        const canVerify = (entry.verdict === null || entry.verdict === undefined);
+        const verifyBtns = canVerify
+            ? `<button class="btn btn-ok btn-sm" onclick="quickVerdict(${origIdx},true)" title="Mark correct">&#10003;</button>
+               <button class="btn btn-fail btn-sm" onclick="quickVerdict(${origIdx},false)" style="margin-left:4px" title="Mark incorrect">&#10007;</button>`
+            : '<span style="color:var(--text-muted);font-size:11px">Done</span>';
+        return `<tr class="${rowClass}">
+            <td class="mono">${esc(entry.call_id || origIdx+1)}</td>
+            <td>${tsShort(entry.timestamp)}</td>
+            <td><span class="chip chip-label">${esc(entry.label_searched || '—')}</span></td>
+            <td class="mono">${esc(entry.object_id || '—')}</td>
+            <td>${confBar(entry.confidence)}</td>
+            <td class="mono" style="font-size:11px">${esc(bboxStr)}</td>
+            <td class="mono">${entry.x != null ? Number(entry.x).toFixed(3) : '—'}</td>
+            <td class="mono">${entry.y != null ? Number(entry.y).toFixed(3) : '—'}</td>
+            <td class="mono">${entry.z != null ? Number(entry.z).toFixed(3) : '—'}</td>
+            <td class="mono">${thetaDeg}</td>
+            <td>${entry.success ? '<span class="chip chip-ok">&#10003;</span>' : '<span class="chip chip-fail">&#10007;</span>'}</td>
+            <td>${verdictChip}</td>
+            <td style="white-space:nowrap">${verifyBtns}</td>
+            <td style="max-width:220px;font-size:11.5px;color:var(--text-secondary);word-break:break-word">${esc(entry.message||'')}</td>
+        </tr>`;
+    });
+    tbody.innerHTML = rows.join('');
+}
+
+async function quickVerdict(idx, correct) {
+    // Save a verdict for history[idx] (called by the verify buttons rendered in the history table).
+    const entry = history[idx];
+    if (!entry) return;
+    try {
+        const res  = await fetch('/api/find-object-verdict', {
+            method:  'POST',
+            headers: { 'Content-Type': 'application/json' },
+            body:    JSON.stringify({ call_id: entry.call_id, verdict: correct })
+        });
+        const data = await res.json();
+        // A refused verdict used to be dropped silently; log it like the network-failure path.
+        if (!data.ok) { console.warn('Verdict rejected:', data.error || 'unknown error'); return; }
+        entry.verdict = correct;
+        if (pendingIdx === idx) showHITL(entry);   // keep the HITL panel in sync
+        renderAll();
+    } catch (e) { console.warn('Verdict failed:', e); }
+}
+
+function renderAccuracyReport() {
+    // Per-label accuracy table built from `history`, labels with the most calls first.
+    const esc = s => String(s).replace(/[&<>"']/g, c => `&#${c.charCodeAt(0)};`);
+    const tbody = document.getElementById('accuracyBody');
+    if (!history.length) {
+        tbody.innerHTML = '<tr class="no-data-row"><td colspan="9">No data yet.</td></tr>';
+        return;
+    }
+    const byLabel = Object.create(null);   // no prototype: labels like "constructor"/"__proto__" stay plain keys
+    for (const entry of history) {
+        const lbl = entry.label_searched || 'unknown';
+        if (!byLabel[lbl]) byLabel[lbl] = { total:0, success:0, failed:0, reviewed:0, correct:0, incorrect:0, confs:[] };
+        const b = byLabel[lbl];
+        b.total++;
+        entry.success ? b.success++ : b.failed++;
+        if (entry.verdict === true)  { b.reviewed++; b.correct++;   }
+        if (entry.verdict === false) { b.reviewed++; b.incorrect++; }
+        if (entry.confidence != null && entry.confidence !== '' && Number.isFinite(Number(entry.confidence))) b.confs.push(Number(entry.confidence));
+    }
+    const rows = Object.entries(byLabel).sort((a,b)=>b[1].total-a[1].total).map(([lbl, b]) => {
+        const ratio = b.correct/b.reviewed, hitlAcc = b.reviewed ? (ratio*100).toFixed(1)+'%' : '—';   // ratio is only used when reviewed > 0
+        const avgConf = b.confs.length ? confBar(b.confs.reduce((s,v)=>s+v,0)/b.confs.length) : '—';
+        return `<tr>
+            <td><span class="chip chip-label">${esc(lbl)}</span></td>
+            <td class="mono">${b.total}</td>
+            <td class="mono" style="color:#15803d">${b.success}</td>
+            <td class="mono" style="color:#dc2626">${b.failed}</td>
+            <td class="mono">${b.reviewed}</td>
+            <td class="mono" style="color:#15803d">${b.correct}</td>
+            <td class="mono" style="color:#dc2626">${b.incorrect}</td>
+            <td>${b.reviewed
+                ? `<div class="conf-bar"><div class="conf-track"><div class="conf-fill ${confClass(ratio)}" style="width:${Math.round(ratio*100)}%"></div></div><span class="conf-num ${confClass(ratio)}">${hitlAcc}</span></div>`
+                : '—'}</td>
+            <td>${avgConf}</td>
+        </tr>`;
+    });
+    tbody.innerHTML = rows.join('');
+}
+
+// ── Clear history ─────────────────────────────────────────────────────────
+async function clearHistory() {  // after confirmation, clear the server-side history and reset the page
+    if (!confirm('Clear all find_object call history?')) return;
+    try {
+        const res = await fetch('/api/find-object-clear', { method: 'POST' });
+        if (!res.ok) throw new Error(`server responded with HTTP ${res.status}`);  // fetch() resolves on HTTP errors too
+        history = []; pendingIdx = null;
+        document.getElementById('hitlEmpty').style.display   = 'block';
+        document.getElementById('hitlContent').style.display = 'none';
+        document.getElementById('hitlBadge').textContent     = 'Waiting for call…';
+        renderAll();
+    } catch (e) { alert('Clear failed: ' + e.message); }
+}
+
+// ── Auto-poll ─────────────────────────────────────────────────────────────
+loadHistory();                     // initial load as soon as the script runs
+setInterval(loadHistory, 3000);    // then re-fetch and re-render every 3 s
+</script>
+</body>
+</html>
diff --git a/dashboard/index.html b/dashboard/index.html
index a3bd85d..241e612 100644
--- a/dashboard/index.html
+++ b/dashboard/index.html
@@ -511,6 +511,10 @@
         <div class="sb-dot" style="background:#6366f1"></div>
         Object Explorer
     </div>
+    <div class="sb-link" onclick="window.location.href='find_object.html'">
+        <div class="sb-dot" style="background:#10b981"></div>
+        Find Object (HITL)
+    </div>
 </nav>
 
 <!-- ══════════════════════════════════ MAIN ═════════════════════════════════ -->
@@ -539,7 +543,7 @@
             <div class="kpi-card" style="--accent:var(--color-runs)">
                 <div class="kpi-value" id="runHistoryCount">0</div>
                 <div class="kpi-label">Stored Runs</div>
-                <div class="kpi-sub">Rolling last 20</div>
+                <div class="kpi-sub">Rolling last 50</div>
             </div>
             <div class="kpi-card" style="--accent:var(--color-sam)">
                 <div class="kpi-value" id="samCount">0</div>
@@ -580,7 +584,7 @@
                 <div class="section-accent" style="background:var(--color-runs)"></div>
                 <div>
                     <div class="section-title">Vision Run Summary</div>
-                    <div class="section-subtitle">vision_runs_history.json · newest first · max 20 runs</div>
+                    <div class="section-subtitle">vision_runs_history.json · newest first · max 50 runs</div>
                 </div>
                 <span class="section-badge" id="runHistoryBadge" style="background:var(--color-runs)">0 Runs</span>
             </div>
@@ -1049,9 +1053,31 @@
         updateCLIPClassifications(data.clip_classifications);
         updateGraspDetections(data.grasp_detections);
         updateSceneUnderstanding(data.scene_understanding);
+
+        // OBB live records from /api/data (synced from vision_runs_history.json)
+        if (data.obb_detections && data.obb_detections.length) {
+            updateOBBFromLiveData(data.obb_detections);
+        }
+
         document.getElementById('lastUpdated').textContent = new Date().toLocaleTimeString();
     }
 
+    function updateOBBFromLiveData(records) {
+        // Fill the OBB metric tiles from the live /api/data feed; no-op without any angle_deg value.
+        if (!records.length) return;
+        const angles = records.map(r => r.angle_deg).filter(a => a != null);
+        if (!angles.length) return;
+        const put = (id, text) => { document.getElementById(id).textContent = text; };
+        const deg = v => v.toFixed(1) + '°';
+        put('obbAvgAngle', deg(angles.reduce((s, v) => s + v, 0) / angles.length));
+        put('obbMinAngle', deg(Math.min(...angles)));
+        put('obbMaxAngle', deg(Math.max(...angles)));
+        put('obbTotalObjects', records.length);
+        put('obbBadge', `${records.length} Objects`);
+        setNav('nav-obb', records.length);
+        put('obbCount', records.length);
+    }
+
     // ── Pixel to Real ─────────────────────────────────────────────────────────
     function updatePixelToReal(records) {
         document.getElementById('pixelBadge').textContent = `${records.length} Records`;
diff --git a/vision/benchmark_dashboard.py b/vision/benchmark_dashboard.py
index beca947..67ef805 100644
--- a/vision/benchmark_dashboard.py
+++ b/vision/benchmark_dashboard.py
@@ -75,6 +75,7 @@ def __init__(self):
             'sam_detections': [],
             'clip_classifications': [],
             'grasp_detections': [],
+            'obb_detections': [],
             'scene_understanding': [],
             'metadata': {
                 'start_time': datetime.now().isoformat(),
@@ -147,7 +148,10 @@ def __init__(self):
         
         # Timer to publish data periodically
         self.publish_timer = self.create_timer(1.0, self.publish_data)
-        
+
+        # Timer to sync CLIP/OBB/GraspNet/Pixel-to-Real from vision_runs_history.json
+        self.sync_timer = self.create_timer(2.0, self.sync_from_run_history)
+
         # Start HTTP server in separate thread
         self.start_http_server()
         
@@ -312,12 +316,125 @@ def add_grasp_detection_record(self, grasp_pose):
         
         self.data['metadata']['total_calls'] += 1
     
+    def sync_from_run_history(self):
+        """Rebuild CLIP, GraspNet, Pixel-to-Real and OBB records from vision_runs_history.json.
+
+        Keeps the /api/data sections populated even when the dedicated service nodes are
+        not running. A list in ``self.data`` is replaced only when the file yielded at least
+        one record for it. Errors are logged as warnings and never raised.
+        """
+        def _num(value, default=0.0):
+            # History fields may be '', None or otherwise non-numeric. A bare float() raised
+            # on those and the outer handler then dropped every run, so convert leniently.
+            try:
+                return float(value)
+            except (TypeError, ValueError):
+                return default
+
+        try:
+            from pathlib import Path
+            history_file = Path(__file__).parent.parent / 'vision_runs_history.json'
+            if not history_file.exists():
+                return
+
+            with open(history_file, 'r') as f:
+                runs = json.load(f)
+            if not isinstance(runs, list) or not runs:
+                return
+
+            timestamp = datetime.now().isoformat()  # fallback for runs without meta.timestamp
+            # Records are collected in file order; only the last 1000 of each kind are kept.
+            new_clip, new_grasp, new_pixel, new_obb = [], [], [], []
+
+            for run in runs:
+                if not isinstance(run, dict):
+                    continue
+                meta   = run.get('meta') or {}
+                run_ts = meta.get('timestamp', timestamp)
+                run_no = meta.get('run_no', 0)
+
+                for obj in run.get('objects') or []:
+                    if not isinstance(obj, dict):
+                        continue
+                    object_id = obj.get('object_id', '')
+                    test_id   = f"{run_no}:{object_id}"
+                    bbox      = [obj.get('bbox_x1', 0), obj.get('bbox_y1', 0),
+                                 obj.get('bbox_x2', 0), obj.get('bbox_y2', 0)]
+
+                    # ── CLIP ──────────────────────────────────────────────────
+                    clip_conf = _num(obj.get('clip_confidence'), None)
+                    label     = obj.get('label', '')
+                    if clip_conf is not None and label:
+                        new_clip.append({
+                            'timestamp':     run_ts,
+                            'test_id':       test_id,
+                            'bbox':          dict(zip(('x1', 'y1', 'x2', 'y2'), bbox)),
+                            'label':         label,
+                            'confidence':    clip_conf,
+                            'top1_accuracy': clip_conf >= 0.5,
+                        })
+
+                    # ── GraspNet ──────────────────────────────────────────────
+                    grasp = obj.get('grasp') or {}
+                    if obj.get('has_grasp') and grasp:
+                        pix = grasp.get('pixel') or {}
+                        wld = grasp.get('world') or {}
+                        new_grasp.append({
+                            'timestamp':          run_ts,
+                            'test_id':            test_id,
+                            'object_id':          object_id,
+                            'pixel_position':     {'u': pix.get('u', 0), 'v': pix.get('v', 0)},
+                            'world_position':     {k: wld.get(k, 0.0) for k in ('x', 'y', 'z')},
+                            'quality_score':      _num(grasp.get('quality_score')),
+                            'grasp_width':        _num(grasp.get('grasp_width')),
+                            'approach_direction': grasp.get('approach_direction', ''),
+                            'bbox':               list(bbox),
+                        })
+
+                    # ── Pixel-to-Real ─────────────────────────────────────────
+                    world   = obj.get('world') or {}
+                    world_x = _num(world.get('x'), None)
+                    if world_x is not None:
+                        new_pixel.append({
+                            'timestamp': run_ts,
+                            'test_id':   test_id,
+                            'input':     {'u': world.get('u', 0), 'v': world.get('v', 0)},
+                            'output':    {'x': world_x, 'y': _num(world.get('y')), 'z': _num(world.get('z'))},
+                        })
+
+                    # ── OBB ───────────────────────────────────────────────────
+                    obb_angle = _num(obj.get('obb_angle_deg'), None)
+                    if obb_angle is not None:
+                        new_obb.append({
+                            'timestamp':      run_ts,
+                            'test_id':        test_id,
+                            'object_id':      object_id,
+                            'label':          label,
+                            'angle_deg':      obb_angle,
+                            'theta_rad':      _num(obj.get('obb_theta_rad')),
+                            'width_px':       _num(obj.get('obb_width_px')),
+                            'height_px':      _num(obj.get('obb_height_px')),
+                            'center_u':       _num(obj.get('obb_center_u')),
+                            'center_v':       _num(obj.get('obb_center_v')),
+                            'sam_confidence': _num(obj.get('sam_confidence')),
+                            'bbox':           list(bbox),
+                        })
+
+            # Only update if we got new data (avoids overwriting live topic data with empty)
+            for key, records in (('clip_classifications', new_clip), ('grasp_detections', new_grasp),
+                                 ('pixel_to_real', new_pixel), ('obb_detections', new_obb)):
+                if records:
+                    self.data[key] = records[-1000:]
+
+        except Exception as e:
+            self.get_logger().warn(f'sync_from_run_history failed: {e}')
+
     def publish_data(self):
         """Publish benchmark data to topic"""
         msg = String()
         msg.data = json.dumps(self.data, cls=_ROSJSONEncoder)
         self.data_publisher.publish(msg)
-    
+
     def clear_data_callback(self, request, response):
         """Clear all benchmark data"""
         self.data = {
@@ -325,16 +442,17 @@ def clear_data_callback(self, request, response):
             'sam_detections': [],
             'clip_classifications': [],
             'grasp_detections': [],
+            'obb_detections': [],
             'scene_understanding': [],
             'metadata': {
                 'start_time': datetime.now().isoformat(),
                 'total_calls': 0
             }
         }
-        
+
         response.success = True
         response.message = "Benchmark data cleared"
-        
+
         self.get_logger().info('Benchmark data cleared')
         return response
     
@@ -348,7 +466,7 @@ def start_http_server(self):
         except Exception:
             html_dir = Path(__file__).parent.parent / 'dashboard'
 
-        # History JSON is written by simple_sam_detector next to the installed module
+        # History JSON files written next to the installed module
         package_path = Path(__file__).parent.parent
 
         self.get_logger().info(f'Dashboard HTML dir: {html_dir}')
@@ -360,47 +478,219 @@ def start_http_server(self):
             self.get_logger().warn('Creating basic HTML file...')
             html_dir.mkdir(exist_ok=True)
             self.create_default_html(html_file)
-        
-        # Custom handler that serves files from html_dir and provides data endpoint
+
+        node_logger = self.get_logger()
+
+        # Custom handler that serves files and provides API endpoints
         class DashboardHandler(SimpleHTTPRequestHandler):
             def __init__(self, *args, dashboard_node=None, **kwargs):
                 self.dashboard_node = dashboard_node
                 super().__init__(*args, directory=str(html_dir), **kwargs)
-            
+
+            # ── helpers ────────────────────────────────────────────────────
+            def _json_response(self, data, status=200):
+                body = json.dumps(data, cls=_ROSJSONEncoder).encode()
+                self.send_response(status)
+                self.send_header('Content-type', 'application/json')
+                self.send_header('Access-Control-Allow-Origin', '*')
+                self.end_headers()
+                self.wfile.write(body)
+
+            def _read_json_file(self, path, default):  # parsed JSON from path, else default
+                try:
+                    with open(path, 'r') as f:
+                        return json.load(f)
+                except Exception as e:
+                    if not isinstance(e, FileNotFoundError):  # a missing file is expected
+                        node_logger.warn(f'Could not read {path}: {e}')
+                return default
+
+            def _write_json_file(self, path, data):
+                with open(path, 'w') as f:
+                    json.dump(data, f, indent=2)
+
+            # ── OPTIONS (CORS pre-flight) ───────────────────────────────────
+            def do_OPTIONS(self):
+                self.send_response(204)
+                self.send_header('Access-Control-Allow-Origin', '*')
+                self.send_header('Access-Control-Allow-Methods', 'GET, POST, OPTIONS')
+                self.send_header('Access-Control-Allow-Headers', 'Content-Type')
+                self.end_headers()
+
+            # ── GET ────────────────────────────────────────────────────────
             def do_GET(self):
                 if self.path == '/api/data':
-                    # Serve benchmark data as JSON
-                    self.send_response(200)
-                    self.send_header('Content-type', 'application/json')
-                    self.send_header('Access-Control-Allow-Origin', '*')
-                    self.end_headers()
-                    data_json = json.dumps(self.dashboard_node.data, cls=_ROSJSONEncoder)
-                    self.wfile.write(data_json.encode())
+                    self._json_response(self.dashboard_node.data)
+
                 elif self.path == '/api/run-history':
-                    # Serve vision_runs_history.json from workspace root
                     history_file = package_path / 'vision_runs_history.json'
-                    self.send_response(200)
-                    self.send_header('Content-type', 'application/json')
-                    self.send_header('Access-Control-Allow-Origin', '*')
-                    self.end_headers()
-                    if history_file.exists():
-                        self.wfile.write(history_file.read_bytes())
-                    else:
-                        self.wfile.write(b'[]')
+                    data = self._read_json_file(history_file, [])
+                    self._json_response(data)
+
+                elif self.path == '/api/find-object-history':
+                    fo_file = package_path / 'find_object_history.json'
+                    data = self._read_json_file(fo_file, [])
+                    self._json_response(data)
+
                 else:
-                    # Serve static files
                     super().do_GET()
-        
+
+            # ── POST ───────────────────────────────────────────────────────
+            def do_POST(self):
+                """Dispatch JSON POST requests to the find-object API endpoints.
+
+                A missing, malformed or non-object body is treated as ``{}``.
+                """
+                try:
+                    length = max(0, int(self.headers.get('Content-Length') or 0))
+                    payload = json.loads(self.rfile.read(length)) if length else {}
+                except (ValueError, OSError, RecursionError):  # bad header/JSON, I/O
+                    payload = {}
+                if not isinstance(payload, dict):  # handlers call payload.get()
+                    payload = {}
+                if self.path == '/api/find-object':
+                    self._handle_find_object(payload)
+                elif self.path == '/api/find-object-verdict':
+                    self._handle_verdict(payload)
+                elif self.path == '/api/find-object-clear':
+                    self._write_json_file(package_path / 'find_object_history.json', [])
+                    self._json_response({'ok': True})
+                else:
+                    self._json_response({'error': 'unknown endpoint'}, 404)
+
+            # ── /api/find-object ──────────────────────────────────────────
+            def _handle_find_object(self, payload):
+                """Call the /find_object ROS2 service and persist the result.
+
+                Responds 400 when ``payload`` carries no label; otherwise replies
+                with the history entry (also written to find_object_history.json).
+                """
+                import subprocess
+                label = str(payload.get('label') or '').strip() if isinstance(payload, dict) else ''
+                if not label:
+                    self._json_response({'error': 'label is required'}, 400)
+                    return
+
+                fo_file = package_path / 'find_object_history.json'
+                history = self._read_json_file(fo_file, [])
+                if not isinstance(history, list):
+                    history = []
+                # max + 1, not len + 1: len repeats ids once the list is trimmed to 50.
+                ids = [e['call_id'] for e in history
+                       if isinstance(e, dict) and isinstance(e.get('call_id'), int)]
+                call_id = max(ids, default=0) + 1
+                timestamp = datetime.now().isoformat()
+
+                # Argument list, no shell: the label comes from an HTTP client and must
+                # never reach /bin/sh. json.dumps() quotes it as a YAML double-quoted scalar.
+                cmd = ['ros2', 'service', 'call', '/find_object',
+                       'custom_interfaces/srv/FindObjectReal',
+                       '{label: ' + json.dumps(label) + '}']
+                try:
+                    result = subprocess.run(
+                        cmd, capture_output=True, text=True, timeout=30)
+                    output = result.stdout + result.stderr
+                    node_logger.info(f'find_object [{label}] stdout: {output[:300]}')
+                    entry = _parse_find_object_response(output, label, call_id, timestamp)
+                except Exception as e:
+                    if isinstance(e, subprocess.TimeoutExpired):
+                        message = 'Service call timed out (30 s)'
+                    else:
+                        message = f'Error: {e}'
+                    entry = {
+                        'call_id': call_id, 'timestamp': timestamp,
+                        'label_searched': label, 'success': False,
+                        'message': message,
+                        'object_id': '', 'bbox': [], 'confidence': 0.0,
+                        'x': 0.0, 'y': 0.0, 'z': 0.0, 'theta': 0.0,
+                        'verdict': None,
+                    }
+
+                history.append(entry)
+                history = history[-50:]
+                self._write_json_file(fo_file, history)
+                self._json_response(entry)
+
+            # ── /api/find-object-verdict ──────────────────────────────────
+            def _handle_verdict(self, payload):
+                """Store the user's true/false verdict on a logged find-object call."""
+                call_id = payload.get('call_id')
+                verdict = payload.get('verdict')  # true / false
+                if call_id is None or verdict is None:
+                    self._json_response({'error': 'call_id and verdict required'}, 400)
+                    return
+
+                fo_file = package_path / 'find_object_history.json'
+                history = self._read_json_file(fo_file, [])
+                # call_ids are not guaranteed unique (ids derived from the list length
+                # repeat once the history is trimmed), so match the newest entry first.
+                for entry in reversed(history if isinstance(history, list) else []):
+                    if isinstance(entry, dict) and entry.get('call_id') == call_id:
+                        entry['verdict'] = bool(verdict)
+                        self._write_json_file(fo_file, history)
+                        self._json_response({'ok': True})
+                        return
+
+                self._json_response({'error': f'call_id {call_id} not found'}, 404)
+
+            def log_message(self, fmt, *args):
+                """Silence the default per-request access logging (deliberate no-op)."""
+
+        def _parse_find_object_response(output, label, call_id, timestamp):
+            """Parse ``ros2 service call`` CLI output into a history entry dict.
+
+            Fields that cannot be found keep their defaults; ``message`` falls
+            back to the first 500 characters of the raw output.
+            """
+            import re
+            # Full float syntax: optional sign, digits, optional exponent (e.g. 5e-05).
+            num = r'([-+]?(?:\d+\.?\d*|\.\d+)(?:[eE][-+]?\d+)?)'
+            entry = {
+                'call_id': call_id, 'timestamp': timestamp,
+                'label_searched': label, 'success': False,
+                'message': output.strip()[:500],
+                'object_id': '', 'bbox': [], 'confidence': 0.0,
+                'x': 0.0, 'y': 0.0, 'z': 0.0, 'theta': 0.0,
+                'verdict': None,
+            }
+            try:
+                # success field
+                m = re.search(r'\bsuccess=(\w+)', output)
+                if m:
+                    entry['success'] = m.group(1).lower() == 'true'
+                # single-quoted string fields
+                for field in ('message', 'object_id'):
+                    m = re.search(rf"\b{field}='([^']*)'", output)
+                    if m:
+                        entry[field] = m.group(1)
+                # bbox
+                m = re.search(r'\bbbox=\[([^\]]*)\]', output)
+                if m:
+                    try:
+                        entry['bbox'] = [int(x.strip()) for x in m.group(1).split(',') if x.strip()]
+                    except ValueError:
+                        pass  # non-integer bbox text: keep the empty default
+                # confidence, x, y, z, theta. The \b anchor keeps short names such
+                # as 'x' from matching inside longer identifiers (e.g. 'max=').
+                for field in ('confidence', 'x', 'y', 'z', 'theta'):
+                    m = re.search(rf'\b{field}={num}', output)
+                    if m:
+                        entry[field] = float(m.group(1))
+            except Exception as e:
+                node_logger.warn(f'Response parse error: {e}')
+            return entry
+
         # Create handler with dashboard_node reference
         def handler_with_node(*args, **kwargs):
             return DashboardHandler(*args, dashboard_node=self, **kwargs)
-        
+
         # Start server in separate thread
         server = HTTPServer(('0.0.0.0', 8080), handler_with_node)
         server_thread = threading.Thread(target=server.serve_forever, daemon=True)
         server_thread.start()
-        
+
         self.get_logger().info(f'HTTP server started on http://localhost:8080')
+        self.get_logger().info(f'Find Object page: http://localhost:8080/find_object.html')
         self.get_logger().info(f'Serving files from: {html_dir}')
     
     def create_default_html(self, html_file):
diff --git a/vision/clip_classifier.py b/vision/clip_classifier.py
index 897094e..b44e029 100755
--- a/vision/clip_classifier.py
+++ b/vision/clip_classifier.py
@@ -1286,244 +1286,173 @@ def _classify_regions(self, rgb_image: np.ndarray, bboxes: List[List[int]]) -> D
     
     def visualization_callback(self):
         """Display camera feed with classification in OpenCV window"""
-        # Use latest_rgb for real-time display, fallback to captured_frame
         frame_to_display = self.latest_rgb if self.latest_rgb is not None else self.captured_frame
-        
+
         if frame_to_display is None:
-            # Show waiting message
             blank = np.zeros((480, 640, 3), dtype=np.uint8)
-            cv2.putText(
-                blank, 
-                f"Waiting to capture frame from {self.rgb_topic}...", 
-                (50, 240),
-                cv2.FONT_HERSHEY_SIMPLEX, 
-                0.8, 
-                (255, 255, 255), 
-                2
-            )
+            cv2.putText(blank, f"Waiting for {self.rgb_topic}...", (60, 240),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.6, (160, 160, 160), 1)
             cv2.imshow(self.window_name, blank)
             cv2.waitKey(1)
             return
-        
-        # Create visualization image from latest live frame
+
         vis_image = frame_to_display.copy()
         h, w = vis_image.shape[:2]
-        
-        # Check if we have region classifications (from SAM auto-classification)
+
+        # ── Helpers ──────────────────────────────────────────────────────────
+        COLORS = [
+            (0,  200, 255),   # amber
+            (80, 255,  80),   # lime
+            (255,  80,  80),  # blue
+            (255,   0, 200),  # magenta
+            (0,  230, 230),   # yellow
+            (200,  80, 255),  # violet
+            (0,  255, 180),   # spring green
+            (255, 180,   0),  # sky blue
+        ]
+        FOUND_COLOR = (60, 230, 60)   # bright green for "found" object
+
+        def semi_rect(img, x1, y1, x2, y2, fill=(15, 15, 15), alpha=0.75):
+            x1, y1 = max(0, x1), max(0, y1)
+            x2, y2 = min(img.shape[1]-1, x2), min(img.shape[0]-1, y2)
+            if x2 <= x1 or y2 <= y1:
+                return
+            roi = img[y1:y2, x1:x2]
+            img[y1:y2, x1:x2] = cv2.addWeighted(roi, 1-alpha, np.full_like(roi, fill), alpha, 0)
+
+        def corner_bracket(img, x1, y1, x2, y2, color, lw=2):
+            clen = max(10, int(min(x2-x1, y2-y1) * 0.15))
+            for (px, py, dx, dy) in [(x1,y1,1,1),(x2,y1,-1,1),(x1,y2,1,-1),(x2,y2,-1,-1)]:
+                cv2.line(img, (px, py), (px + dx*clen, py), color, lw)
+                cv2.line(img, (px, py), (px, py + dy*clen), color, lw)
+
+        def draw_label(img, text, x, y, color, fs=0.36, ft=1, pad=4, accent=3):
+            """Draw a semi-transparent dark label with a color accent bar."""
+            (lw_px, lh_px), _ = cv2.getTextSize(text, cv2.FONT_HERSHEY_SIMPLEX, fs, ft)
+            bx1, by1 = x, y - lh_px - pad
+            bx2, by2 = x + accent + pad + lw_px + pad, y + pad
+            semi_rect(img, bx1, by1, bx2, by2)
+            cv2.rectangle(img, (max(0,bx1), max(0,by1)), (max(0,bx1)+accent, max(0,by2)), color, -1)
+            cv2.putText(img, text, (bx1 + accent + pad, y),
+                        cv2.FONT_HERSHEY_SIMPLEX, fs, (235, 235, 235), ft)
+
+        # ── Region classifications (SAM + CLIP pipeline) ──────────────────
         if self.latest_region_classifications:
-            # Draw each classified region with bounding box and label
-            for region in self.latest_region_classifications:
-                bbox = region['bbox']
-                top_pred = region['top_prediction']
+            for ri, region in enumerate(self.latest_region_classifications):
+                bbox      = region['bbox']
+                top_pred  = region['top_prediction']
                 region_id = region['region_id']
-                
-                # Draw bounding box
-                cv2.rectangle(
-                    vis_image,
-                    (bbox[0], bbox[1]),
-                    (bbox[2], bbox[3]),
-                    (0, 255, 255),  # Yellow for classified regions
-                    3
-                )
-                
-                # Prepare label text
-                label = f"#{region_id}: {top_pred['label']}"
-                conf = f"{top_pred['confidence']:.1%}"
-                
-                # Calculate label position (above bbox)
-                label_size, _ = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.7, 2)
-                
-                # Draw label background
-                cv2.rectangle(
-                    vis_image,
-                    (bbox[0], bbox[1] - label_size[1] - 25),
-                    (bbox[0] + max(label_size[0], 100), bbox[1]),
-                    (0, 255, 255),
-                    -1
-                )
-                
-                # Draw label text
-                cv2.putText(
-                    vis_image,
-                    label,
-                    (bbox[0] + 5, bbox[1] - 10),
-                    cv2.FONT_HERSHEY_SIMPLEX,
-                    0.7,
-                    (0, 0, 0),
-                    2
-                )
-                
-                # Draw confidence
-                cv2.putText(
-                    vis_image,
-                    conf,
-                    (bbox[0] + 5, bbox[1] - 30),
-                    cv2.FONT_HERSHEY_SIMPLEX,
-                    0.6,
-                    (0, 0, 0),
-                    2
-                )
-            
-            # Add info text
-            info_text = f"Classified Regions: {len(self.latest_region_classifications)}"
-            cv2.putText(
-                vis_image,
-                info_text,
-                (10, 30),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                0.8,
-                (0, 255, 255),
-                2
-            )
-            
-        # Draw full image classification overlay (if available and no regions)
+                color     = COLORS[ri % len(COLORS)]
+                x1, y1, x2, y2 = bbox
+
+                # Corner-bracket bbox + thin outline
+                cv2.rectangle(vis_image, (x1, y1), (x2, y2), color, 1)
+                corner_bracket(vis_image, x1, y1, x2, y2, color, lw=2)
+
+                # Label: "#id  class  conf%"
+                conf_pct = top_pred['confidence']
+                label = f"#{region_id}  {top_pred['label']}  {conf_pct:.0%}"
+
+                # Place above bbox, clamp to image top
+                ly = y1 - 5
+                if ly < 16:
+                    ly = y2 + 16
+                draw_label(vis_image, label, x1, ly, color)
+
+                # Confidence bar under bbox top edge
+                bar_w = x2 - x1
+                filled = max(2, int(bar_w * conf_pct))
+                cv2.rectangle(vis_image, (x1, y1), (x1 + bar_w, y1 + 3), (40, 40, 40), -1)
+                cv2.rectangle(vis_image, (x1, y1), (x1 + filled, y1 + 3), color, -1)
+
+        # ── Full-image classification (no regions) ────────────────────────
         elif self.latest_classification:
-            top_pred = self.latest_classification['output']['top_prediction']
-            all_preds = self.latest_classification['output']['all_predictions'][:5]  # Top 5
-            
-            # Draw semi-transparent overlay at bottom
-            overlay = vis_image.copy()
-            cv2.rectangle(overlay, (0, h-150), (w, h), (0, 0, 0), -1)
-            vis_image = cv2.addWeighted(vis_image, 0.7, overlay, 0.3, 0)
-            
-            # Draw top prediction (large)
-            label_text = f"Top: {top_pred['label']}"
-            conf_text = f"{top_pred['confidence']:.1%}"
-            
-            cv2.putText(
-                vis_image,
-                label_text,
-                (20, h-100),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                1.2,
-                (0, 255, 0),
-                3
-            )
-            
-            cv2.putText(
-                vis_image,
-                conf_text,
-                (20, h-60),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                1.0,
-                (0, 255, 0),
-                2
-            )
-            
-            # Draw top 5 predictions (smaller, on right)
-            y_offset = h - 120
+            top_pred  = self.latest_classification['output']['top_prediction']
+            all_preds = self.latest_classification['output']['all_predictions'][:5]
+
+            # Bottom panel
+            panel_h = 110
+            semi_rect(vis_image, 0, h - panel_h, w, h, fill=(12, 12, 12), alpha=0.80)
+
+            # Top prediction
+            top_label = f"{top_pred['label']}"
+            top_conf  = f"{top_pred['confidence']:.1%}"
+            cv2.putText(vis_image, top_label, (14, h - panel_h + 26),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.65, (80, 255, 80), 1)
+            cv2.putText(vis_image, top_conf, (14, h - panel_h + 46),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.42, (160, 255, 160), 1)
+
+            # Confidence bar for top prediction
+            bar_max = min(w // 2 - 20, 260)
+            filled  = int(bar_max * top_pred['confidence'])
+            cv2.rectangle(vis_image, (14, h - panel_h + 52), (14 + bar_max, h - panel_h + 56), (50, 50, 50), -1)
+            cv2.rectangle(vis_image, (14, h - panel_h + 52), (14 + filled, h - panel_h + 56), (80, 255, 80), -1)
+
+            # Top-5 list on the right
+            col_x = w - 230
+            cv2.putText(vis_image, "Top 5", (col_x, h - panel_h + 18),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.38, (140, 140, 140), 1)
             for i, pred in enumerate(all_preds):
-                text = f"{i+1}. {pred['label']}: {pred['confidence']:.1%}"
-                cv2.putText(
-                    vis_image,
-                    text,
-                    (w - 350, y_offset + i*30),
-                    cv2.FONT_HERSHEY_SIMPLEX,
-                    0.6,
-                    (255, 255, 255),
-                    2
-                )
+                row_text  = f"{i+1}. {pred['label']}"
+                row_conf  = f"{pred['confidence']:.0%}"
+                row_y     = h - panel_h + 34 + i * 16
+                row_color = (200, 200, 200) if i > 0 else (80, 255, 80)
+                cv2.putText(vis_image, row_text, (col_x, row_y),
+                            cv2.FONT_HERSHEY_SIMPLEX, 0.34, row_color, 1)
+                cv2.putText(vis_image, row_conf, (w - 42, row_y),
+                            cv2.FONT_HERSHEY_SIMPLEX, 0.34, row_color, 1)
+
         else:
-            # Show "Call service to classify" message
-            cv2.putText(
-                vis_image,
-                "Call /vision/classify_all or /vision/classify_bb",
-                (20, h-30),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                0.7,
-                (255, 255, 255),
-                2
-            )
-        
-        # Draw found object highlight (if available)
+            # Idle hint at bottom
+            hint = "Run /vision/classify_all or /vision/classify_bb"
+            semi_rect(vis_image, 0, h - 24, w, h, fill=(12, 12, 12), alpha=0.70)
+            cv2.putText(vis_image, hint, (8, h - 8),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.38, (130, 130, 130), 1)
+
+        # ── Found-object highlight ────────────────────────────────────────
         if self.latest_found_object:
             found = self.latest_found_object
-            bbox = found['bbox']
-            
-            # Draw thick green bounding box for found object
-            cv2.rectangle(
-                vis_image,
-                (bbox[0], bbox[1]),
-                (bbox[2], bbox[3]),
-                (0, 255, 0),  # Green for found object
-                5
-            )
-            
-            # Prepare label text
-            label = f"FOUND: {found['label']}"
-            conf = f"Conf: {found['confidence']:.2f}"
-            
-            # Calculate label position (above bbox)
-            label_size, _ = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.9, 2)
-            
-            # Draw label background (green)
-            cv2.rectangle(
-                vis_image,
-                (bbox[0], bbox[1] - label_size[1] - 35),
-                (bbox[0] + max(label_size[0], 150), bbox[1]),
-                (0, 255, 0),
-                -1
-            )
-            
-            # Draw label text
-            cv2.putText(
-                vis_image,
-                label,
-                (bbox[0] + 5, bbox[1] - 15),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                0.9,
-                (0, 0, 0),
-                2
-            )
-            
-            # Draw confidence
-            cv2.putText(
-                vis_image,
-                conf,
-                (bbox[0] + 5, bbox[1] - 40),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                0.7,
-                (0, 0, 0),
-                2
-            )
-            
-            # Add corner markers
-            corner_size = 15
-            # Top-left
-            cv2.line(vis_image, (bbox[0], bbox[1]), (bbox[0] + corner_size, bbox[1]), (0, 255, 0), 5)
-            cv2.line(vis_image, (bbox[0], bbox[1]), (bbox[0], bbox[1] + corner_size), (0, 255, 0), 5)
-            # Top-right
-            cv2.line(vis_image, (bbox[2], bbox[1]), (bbox[2] - corner_size, bbox[1]), (0, 255, 0), 5)
-            cv2.line(vis_image, (bbox[2], bbox[1]), (bbox[2], bbox[1] + corner_size), (0, 255, 0), 5)
-            # Bottom-left
-            cv2.line(vis_image, (bbox[0], bbox[3]), (bbox[0] + corner_size, bbox[3]), (0, 255, 0), 5)
-            cv2.line(vis_image, (bbox[0], bbox[3]), (bbox[0], bbox[3] - corner_size), (0, 255, 0), 5)
-            # Bottom-right
-            cv2.line(vis_image, (bbox[2], bbox[3]), (bbox[2] - corner_size, bbox[3]), (0, 255, 0), 5)
-            cv2.line(vis_image, (bbox[2], bbox[3]), (bbox[2], bbox[3] - corner_size), (0, 255, 0), 5)
-        
-        # Add title bar
-        cv2.putText(
-            vis_image,
-            f"CLIP Classifier | Frame: {self.frame_counter}",
-            (10, 30),
-            cv2.FONT_HERSHEY_SIMPLEX,
-            0.7,
-            (0, 0, 0),
-            4
-        )
-        
-        cv2.putText(
-            vis_image,
-            f"CLIP Classifier | Frame: {self.frame_counter}",
-            (10, 30),
-            cv2.FONT_HERSHEY_SIMPLEX,
-            0.7,
-            (255, 255, 255),
-            2
-        )
-        
-        # Show image
+            bbox  = found['bbox']
+            x1, y1, x2, y2 = bbox
+            conf  = found['confidence']
+
+            # Pulsing-style: thin outline + thick corner brackets
+            cv2.rectangle(vis_image, (x1, y1), (x2, y2), FOUND_COLOR, 1)
+            clen = max(16, int(min(x2-x1, y2-y1) * 0.18))
+            for (px, py, dx, dy) in [(x1,y1,1,1),(x2,y1,-1,1),(x1,y2,1,-1),(x2,y2,-1,-1)]:
+                cv2.line(vis_image, (px, py), (px + dx*clen, py), FOUND_COLOR, 3)
+                cv2.line(vis_image, (px, py), (px, py + dy*clen), FOUND_COLOR, 3)
+
+            # Center dot
+            cx, cy = (x1+x2)//2, (y1+y2)//2
+            cv2.circle(vis_image, (cx, cy), 5, (15, 15, 15), -1)
+            cv2.circle(vis_image, (cx, cy), 5, FOUND_COLOR, 2)
+            cv2.circle(vis_image, (cx, cy), 2, (240, 240, 240), -1)
+
+            # Label + confidence bar
+            label = f"FOUND  {found['label']}  {conf:.0%}"
+            ly = y1 - 5
+            if ly < 16:
+                ly = y2 + 16
+            draw_label(vis_image, label, x1, ly, FOUND_COLOR, fs=0.40, pad=5, accent=4)
+
+            bar_w  = x2 - x1
+            filled = max(2, int(bar_w * conf))
+            cv2.rectangle(vis_image, (x1, y2 - 4), (x1 + bar_w, y2), (40, 40, 40), -1)
+            cv2.rectangle(vis_image, (x1, y2 - 4), (x1 + filled, y2), FOUND_COLOR, -1)
+
+        # ── Top info bar ──────────────────────────────────────────────────
+        bar_h = 22
+        semi_rect(vis_image, 0, 0, w, bar_h, fill=(12, 12, 12), alpha=0.78)
+        if self.latest_region_classifications:
+            status = f"CLIP  |  Regions: {len(self.latest_region_classifications)}  |  Frame: {self.frame_counter}"
+        elif self.latest_classification:
+            status = f"CLIP  |  Full-image mode  |  Frame: {self.frame_counter}"
+        else:
+            status = f"CLIP Classifier  |  Frame: {self.frame_counter}  |  Idle"
+        cv2.putText(vis_image, status, (8, 15),
+                    cv2.FONT_HERSHEY_SIMPLEX, 0.42, (210, 210, 210), 1)
+
         cv2.imshow(self.window_name, vis_image)
         cv2.waitKey(1)
     
diff --git a/vision/find_object_service_node.py b/vision/find_object_service_node.py
index ba31db3..31ec056 100644
--- a/vision/find_object_service_node.py
+++ b/vision/find_object_service_node.py
@@ -5,9 +5,6 @@
 from rclpy.callback_groups import ReentrantCallbackGroup
 from rclpy.executors import MultiThreadedExecutor
 from custom_interfaces.srv import DetectObjects, FindObject, PixelToReal, FindObjectReal, FindObjectAngleBB, FindMultiObjectReal, FindMultiObject
-
-
-
 """
 ros2 service call /find_object custom_interfaces/srv/FindObjectReal "{label: 'bowl'}"
 
@@ -77,7 +74,7 @@ def __init__(self):
         )
         
         self.get_logger().info('Find Object Service Node initialized')
-        
+
         # Wait for services to be available
         self.wait_for_services()
     
@@ -102,6 +99,43 @@ def wait_for_services(self):
         
         self.get_logger().info('Service clients ready')
     
+    def _log_find_object_call(self, label, response):
+        """Append a /find_object call result to find_object_history.json (best-effort, last 50 kept)."""
+        try:
+            with self._history_lock:
+                try:
+                    with open(self._history_file, 'r') as f:
+                        history = json.load(f)
+                except (OSError, ValueError):  # missing, unreadable or corrupt file
+                    history = []
+                if not isinstance(history, list):
+                    history = []
+
+                # max + 1, not len + 1: len repeats ids once the list is trimmed to 50.
+                ids = [e['call_id'] for e in history
+                       if isinstance(e, dict) and isinstance(e.get('call_id'), int)]
+                entry = {
+                    'call_id': max(ids, default=0) + 1,
+                    'timestamp': datetime.now().isoformat(),
+                    'label_searched': label,
+                    'success': bool(response.success),
+                    'message': response.message,
+                    'object_id': response.object_id,
+                    'bbox': [int(v) for v in response.bbox] if response.bbox else [],
+                    'confidence': float(response.confidence),
+                    'x': float(response.x),
+                    'y': float(response.y),
+                    'z': float(response.z),
+                    'theta': float(response.theta),
+                    'verdict': None,
+                }
+                history.append(entry)
+                history = history[-50:]  # keep last 50
+                with open(self._history_file, 'w') as f:
+                    json.dump(history, f, indent=2)
+        except Exception as e:
+            self.get_logger().warn(f'Failed to log find_object call: {e}')
+
     def find_object_callback(self, request, response):
         """
         Main service callback for /find_object
@@ -266,7 +300,8 @@ def find_object_callback(self, request, response):
             response.y = 0.0
             response.z = 0.0
             response.theta = 0.0
-        
+
+        self._log_find_object_call(label, response)
         return response
 
 
diff --git a/vision/obb_angle_service_node.py b/vision/obb_angle_service_node.py
index 41b36cd..649ee0b 100644
--- a/vision/obb_angle_service_node.py
+++ b/vision/obb_angle_service_node.py
@@ -401,149 +401,165 @@ def visualize_obb(self, results, mode="auto"):
         """
         if self.latest_rgb_image is None:
             self.get_logger().warn('No RGB image available for visualization')
-            # Show a blank placeholder window
-            blank = np.zeros((800, 1200, 3), dtype=np.uint8)
-            cv2.putText(blank, "Waiting for RGB camera image...", 
-                       (300, 400), cv2.FONT_HERSHEY_SIMPLEX, 1.5, (255, 255, 255), 3)
-            cv2.putText(blank, f"RGB Topic: {self.rgb_topic}", 
-                       (350, 450), cv2.FONT_HERSHEY_SIMPLEX, 0.8, (128, 128, 128), 2)
+            blank = np.zeros((480, 640, 3), dtype=np.uint8)
+            cv2.putText(blank, "Waiting for RGB camera...", (80, 230),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.65, (160, 160, 160), 1)
+            cv2.putText(blank, self.rgb_topic, (80, 258),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.42, (100, 100, 100), 1)
             cv2.imshow(self.window_name, blank)
             cv2.waitKey(1)
             return
-        
+
         vis_image = self.latest_rgb_image.copy()
-        
+        img_h, img_w = vis_image.shape[:2]
+
         # Auto-detect mode
         if mode == "auto":
             mode = "single" if len(results) == 1 else "multi"
-        
-        # Color palette for objects
-        colors = [
-            (255, 255, 0),   # Cyan
-            (255, 0, 255),   # Magenta
-            (0, 255, 255),   # Yellow
-            (255, 128, 0),   # Orange
-            (128, 255, 0),   # Lime
-            (0, 255, 128),   # Spring Green
-            (255, 0, 128),   # Pink
-            (128, 0, 255),   # Purple
+
+        # Distinct color palette (BGR)
+        COLORS = [
+            (0,  200, 255),   # amber
+            (80, 255,  80),   # lime
+            (255,  80,  80),  # blue
+            (255,   0, 200),  # purple
+            (0,  230, 230),   # yellow
+            (200,  80, 255),  # pink
+            (0,  255, 180),   # chartreuse
+            (255, 180,   0),  # sky blue
         ]
-        
-        # Process each OBB
+
+        def draw_corner_bracket(img, pts, color, lw=2):
+            """Draw corner-bracket accents on an OBB polygon."""
+            n = len(pts)
+            for i in range(n):
+                A = pts[(i - 1) % n].astype(float)
+                B = pts[i].astype(float)
+                C = pts[(i + 1) % n].astype(float)
+                ab = A - B;  ab_len = np.linalg.norm(ab)
+                cb = C - B;  cb_len = np.linalg.norm(cb)
+                if ab_len == 0 or cb_len == 0:
+                    continue
+                clen = max(10, int(min(ab_len, cb_len) * 0.22))
+                p1 = (B + (ab / ab_len) * clen).astype(int)
+                p2 = (B + (cb / cb_len) * clen).astype(int)
+                cv2.line(img, tuple(B.astype(int)), tuple(p1), color, lw)
+                cv2.line(img, tuple(B.astype(int)), tuple(p2), color, lw)
+
+        def semi_transparent_rect(img, x1, y1, x2, y2, fill, alpha=0.72):
+            """Blend a dark rectangle over a sub-region."""
+            x1 = max(0, x1);  y1 = max(0, y1)
+            x2 = min(img.shape[1] - 1, x2);  y2 = min(img.shape[0] - 1, y2)
+            if x2 <= x1 or y2 <= y1:
+                return
+            roi = img[y1:y2, x1:x2]
+            bg  = np.full_like(roi, fill)
+            img[y1:y2, x1:x2] = cv2.addWeighted(roi, 1 - alpha, bg, alpha, 0)
+
+        # ── Process each OBB ─────────────────────────────────────────────────
         for idx, result_tuple in enumerate(results):
-            # Unpack (handle optional bbox)
             if len(result_tuple) == 7:
                 object_id, u, v, theta, width, height, bbox = result_tuple
             else:
                 object_id, u, v, theta, width, height = result_tuple
                 bbox = None
-            
-            color = colors[idx % len(colors)]
-            
-            # Draw AABB first if provided (for single object mode)
-            if bbox is not None and mode == "single":
-                x1, y1, x2, y2 = bbox
-                cv2.rectangle(vis_image, (int(x1), int(y1)), (int(x2), int(y2)), (0, 255, 0), 2)
-                cv2.putText(vis_image, "Input AABB", (int(x1), int(y1) - 5),
-                           cv2.FONT_HERSHEY_SIMPLEX, 0.6, (0, 255, 0), 2)
-            
-            # Get OBB corner points
-            box_points = self.get_obb_corner_points(u, v, theta, width, height)
-            
-            # Draw OBB
-            cv2.drawContours(vis_image, [box_points], 0, color, 3)
-            
-            # Draw center point
-            if mode == "single":
-                cv2.circle(vis_image, (int(u), int(v)), 8, (0, 0, 255), -1)  # Red center
-                cv2.circle(vis_image, (int(u), int(v)), 10, (255, 255, 255), 2)  # White outline
-            else:
-                cv2.circle(vis_image, (int(u), int(v)), 6, (255, 255, 255), -1)
-                cv2.circle(vis_image, (int(u), int(v)), 8, color, 2)
-            
-            # Draw angle arrow perpendicular to WIDTH (shorter dimension), with -90° offset so 0° points UP
-            arrow_length = height   # Use height (shorter dimension) for arrow length
-            # Arrow perpendicular to width = add 90° to theta, then -90° for visualization
-            visual_theta = theta + np.pi / 2 - np.pi / 2  # Perpendicular, then visualization offset
-            end_x = int(u + arrow_length * np.cos(visual_theta))
-            end_y = int(v + arrow_length * np.sin(visual_theta))
-            arrow_thickness = 3 if mode == "single" else 2
-            cv2.arrowedLine(vis_image, (int(u), int(v)), (end_x, end_y), 
-                          (255, 0, 255) if mode == "single" else color, 
-                          arrow_thickness, tipLength=0.3)
-            
-            # Draw label (use remapped angle: 90deg - original geometry angle)
+
+            color = COLORS[idx % len(COLORS)]
+            cx, cy = int(u), int(v)
             angle_geom_deg = np.rad2deg(theta)
             angle_deg = 90.0 - angle_geom_deg
-            
+
+            # ── Input AABB (single mode only) ─────────────────────────────
+            if bbox is not None and mode == "single":
+                ax1, ay1, ax2, ay2 = int(bbox[0]), int(bbox[1]), int(bbox[2]), int(bbox[3])
+                # Thin full rectangle plus corner-bracket accents
+                aabb_pts = np.array([[ax1,ay1],[ax2,ay1],[ax2,ay2],[ax1,ay2]])
+                draw_corner_bracket(vis_image, aabb_pts, (80, 200, 80), lw=1)
+                cv2.rectangle(vis_image, (ax1, ay1), (ax2, ay2), (80, 200, 80), 1)
+                # Small label
+                ts, _ = cv2.getTextSize("AABB", cv2.FONT_HERSHEY_SIMPLEX, 0.33, 1)
+                semi_transparent_rect(vis_image, ax1, ay1 - ts[1] - 6, ax1 + ts[0] + 4, ay1, (18, 18, 18))
+                cv2.putText(vis_image, "AABB", (ax1 + 2, ay1 - 3),
+                            cv2.FONT_HERSHEY_SIMPLEX, 0.33, (80, 200, 80), 1)
+
+            # ── OBB outline ───────────────────────────────────────────────
+            box_pts = self.get_obb_corner_points(u, v, theta, width, height)
+            # Thin full outline
+            cv2.drawContours(vis_image, [box_pts], 0, color, 1)
+            # Corner bracket accents
+            draw_corner_bracket(vis_image, box_pts, color, lw=2)
+
+            # ── Center dot ────────────────────────────────────────────────
+            cv2.circle(vis_image, (cx, cy), 5, (15, 15, 15), -1)   # dark fill
+            cv2.circle(vis_image, (cx, cy), 5, color, 2)            # color ring
+            cv2.circle(vis_image, (cx, cy), 2, (240, 240, 240), -1) # white center
+
+            # ── Angle arrow ───────────────────────────────────────────────
+            visual_theta = theta + np.pi / 2 - np.pi / 2
+            arrow_len = int(max(height * 0.55, 20))
+            end_x = int(cx + arrow_len * np.cos(visual_theta))
+            end_y = int(cy + arrow_len * np.sin(visual_theta))
+            cv2.arrowedLine(vis_image, (cx, cy), (end_x, end_y),
+                            color, 2, tipLength=0.35)
+
+            # ── Info panel (single) / compact label (multi) ───────────────
             if mode == "single":
-                # Concise info box for single object
                 info_lines = [
                     f"{object_id}",
-                    f"Center: ({int(u)}, {int(v)})",
-                    f"Angle: {angle_deg:.1f}deg",
-                    f"Size: {width:.0f}x{height:.0f}"
+                    f"Center  ({cx}, {cy})",
+                    f"Angle   {angle_deg:.1f} deg",
+                    f"Size    {width:.0f} x {height:.0f} px",
                 ]
-                
-                # Draw compact info box at top-right
-                font_scale = 0.6
-                font_thickness = 2
-                line_spacing = 25
-                
-                max_width = 0
-                for line in info_lines:
-                    (text_w, text_h), _ = cv2.getTextSize(line, cv2.FONT_HERSHEY_SIMPLEX, 
-                                                          font_scale, font_thickness)
-                    max_width = max(max_width, text_w)
-                
-                box_height = len(info_lines) * line_spacing + 15
-                box_x = vis_image.shape[1] - max_width - 25
-                box_y = 15
-                
-                # Background with transparency effect
-                overlay = vis_image.copy()
-                cv2.rectangle(overlay, (box_x - 8, box_y - 8),
-                            (box_x + max_width + 8, box_y + box_height), (0, 0, 0), -1)
-                cv2.addWeighted(overlay, 0.7, vis_image, 0.3, 0, vis_image)
-                
+                fs, ft = 0.42, 1
+                pad = 8
+                line_h = 20
+                max_w = max(cv2.getTextSize(l, cv2.FONT_HERSHEY_SIMPLEX, fs, ft)[0][0]
+                            for l in info_lines)
+                panel_w = max_w + pad * 2 + 4   # +4 for accent bar
+                panel_h = len(info_lines) * line_h + pad
+                px = img_w - panel_w - 10
+                py = 28   # sits below top bar
+
+                # Background
+                semi_transparent_rect(vis_image, px - 2, py, px + panel_w, py + panel_h, (15, 15, 15))
+                # Left accent bar
+                cv2.rectangle(vis_image, (px - 2, py), (px + 2, py + panel_h), color, -1)
                 # Border
-                cv2.rectangle(vis_image, (box_x - 8, box_y - 8),
-                            (box_x + max_width + 8, box_y + box_height), color, 2)
-                
-                # Text lines
+                cv2.rectangle(vis_image, (px - 2, py), (px + panel_w, py + panel_h), color, 1)
+
                 for i, line in enumerate(info_lines):
-                    y_pos = box_y + (i * line_spacing) + 18
-                    cv2.putText(vis_image, line, (box_x, y_pos),
-                              cv2.FONT_HERSHEY_SIMPLEX, font_scale, color, font_thickness)
+                    ty = py + pad + i * line_h + line_h // 2
+                    # First line (object id) is drawn in the object's color; remaining lines in light grey
+                    text_color = color if i == 0 else (210, 210, 210)
+                    cv2.putText(vis_image, line, (px + 6, ty),
+                                cv2.FONT_HERSHEY_SIMPLEX, fs, text_color, ft)
             else:
-                # Compact label for multi-object
-                label = f"#{idx} {angle_deg:.1f}deg"
-                label_x = int(u + 15)
-                label_y = int(v)
-                
-                # Text with outline
-                cv2.putText(vis_image, label, (label_x, label_y),
-                           cv2.FONT_HERSHEY_SIMPLEX, 0.7, (0, 0, 0), 5)
-                cv2.putText(vis_image, label, (label_x, label_y),
-                           cv2.FONT_HERSHEY_SIMPLEX, 0.7, color, 2)
-        
-        # Add concise title
-        if mode == "single":
-            title = "OBB Detection"
-        else:
-            title = f"OBB Detection ({len(results)} objects)"
-        
-        cv2.putText(vis_image, title, (10, 35), cv2.FONT_HERSHEY_SIMPLEX, 1.0, (255, 255, 255), 3)
-        cv2.putText(vis_image, title, (10, 35), cv2.FONT_HERSHEY_SIMPLEX, 1.0, (0, 255, 255), 2)
-        
-        # Add concise legend at bottom
-        legend_y = vis_image.shape[0] - 20
-        legend_text = "0deg = Vertical | Range: -90deg to +90deg"
-        
-        cv2.putText(vis_image, legend_text, (10, legend_y),
-                   cv2.FONT_HERSHEY_SIMPLEX, 0.5, (255, 255, 255), 2)
-        
-        # Display
+                # Compact floating label near center
+                label = f"#{idx}  {angle_deg:.1f}°"
+                fs, ft = 0.38, 1
+                (lw_px, lh_px), _ = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, fs, ft)
+                pad = 4
+                lx = cx + 12
+                ly = cy - 6
+                # Clamp
+                lx = min(lx, img_w - lw_px - pad * 2 - 5)
+                ly = max(ly, lh_px + pad + 2)
+
+                semi_transparent_rect(vis_image, lx - 2, ly - lh_px - pad,
+                                      lx + lw_px + pad * 2 + 3, ly + pad, (15, 15, 15))
+                cv2.rectangle(vis_image, (lx - 2, ly - lh_px - pad),
+                              (lx + 3, ly + pad), color, -1)  # accent bar
+                cv2.putText(vis_image, label, (lx + 5, ly),
+                            cv2.FONT_HERSHEY_SIMPLEX, fs, (230, 230, 230), ft)
+
+        # ── Top info bar ─────────────────────────────────────────────────────
+        bar_h = 24
+        obj_count = len(results)
+        title = f"OBB Detection  |  Objects: {obj_count}  |  0 deg = Vertical"
+        semi_transparent_rect(vis_image, 0, 0, img_w, bar_h, (12, 12, 12), alpha=0.78)
+        cv2.putText(vis_image, title, (8, 16),
+                    cv2.FONT_HERSHEY_SIMPLEX, 0.42, (210, 210, 210), 1)
+
         cv2.imshow(self.window_name, vis_image)
         cv2.waitKey(1)
         
diff --git a/vision/simple_sam_detector.py b/vision/simple_sam_detector.py
index b303d75..fdff486 100755
--- a/vision/simple_sam_detector.py
+++ b/vision/simple_sam_detector.py
@@ -29,7 +29,7 @@
 from rclpy.node import Node
 from rclpy.qos import QoSProfile, QoSReliabilityPolicy, QoSHistoryPolicy
 from custom_interfaces.msg import SAMDetections, SAMDetection
-from custom_interfaces.srv import DetectObjects
+from custom_interfaces.srv import DetectObjects, FindObjectAngle, PixelToReal
 from sensor_msgs.msg import Image
 from std_srvs.srv import Trigger
 from std_msgs.msg import Header
@@ -165,7 +165,25 @@ def __init__(self, single_shot_mode=False):
             Trigger,
             '/vision/classify_bbox_filtered'
         )
-        
+
+        # Service client for GraspNet detection
+        self.grasp_client = self.create_client(
+            Trigger,
+            '/vision/detect_grasp'
+        )
+
+        # Service client for OBB angle detection
+        self.obb_client = self.create_client(
+            FindObjectAngle,
+            '/obb/find_object_angle'
+        )
+
+        # Service client for pixel-to-real conversion
+        self.pixel_to_real_client = self.create_client(
+            PixelToReal,
+            '/pixel_to_real'
+        )
+
         # OpenCV window setup
         self.window_name = f"SAM Object Detection - {self.rgb_topic}"
         cv2.namedWindow(self.window_name, cv2.WINDOW_NORMAL)
@@ -240,11 +258,13 @@ def depth_callback(self, msg: Image):
             self.get_logger().error(f"Failed to convert depth image: {e}")
     
     def run_pipeline_callback(self, request, response):
-        """Service callback for /vision/run_pipeline - triggers detection and publishes to topic"""
+        """Service callback for /vision/run_pipeline - runs SAM+CLIP+GraspNet+OBB+Pixel-to-Real"""
+        import time
+        pipeline_start = time.perf_counter()
+
         try:
-            # Use captured frame instead of latest_rgb for consistency
             frame_to_use = self.captured_frame if self.frame_captured else self.latest_rgb
-            
+
             if frame_to_use is None:
                 response.success = False
                 response.message = json.dumps({
@@ -254,53 +274,207 @@ def run_pipeline_callback(self, request, response):
                 }, indent=2)
                 self.get_logger().warn("No image received yet")
                 return response
-            
+
             self.get_logger().info("=" * 80)
-            self.get_logger().info("Running SAM detection on captured frame...")
-            self.get_logger().info(f"Frame shape: {frame_to_use.shape}")
+            self.get_logger().info("Running full pipeline: SAM + CLIP + GraspNet + OBB + Pixel-to-Real")
             self.get_logger().info("=" * 80)
-            
-            # Run detection on captured frame (with IoU tracking from previous frame)
+
+            # ── Step 1: SAM detection ──────────────────────────────────────────
+            sam_start = time.perf_counter()
             self.latest_detections = self._detect_objects(frame_to_use)
-            
-            # Store current detections as previous for next frame IoU calculation
             self.previous_detections = self.latest_detections.copy()
-            
-            # Build JSON response in the requested schema
-            detection_data = self._build_detection_schema()
-            
-            # Publish detections as ROS2 message
             self._publish_detections_ros()
-            
-            response.success = True
-            response.message = json.dumps(detection_data, indent=2)
-            
-            self.get_logger().info("=" * 80)
-            self.get_logger().info(f"Detection complete: {len(self.latest_detections)} objects found")
-            self.get_logger().info("=" * 80)
-            
-            # Print JSON output with bounding boxes
-            self.get_logger().info("JSON OUTPUT (with bounding boxes):")
-            self.get_logger().info("=" * 80)
-            self.get_logger().info(response.message)
-            self.get_logger().info("=" * 80)
-            
-            # Print detection details in readable format
-            self.get_logger().info("Bounding Boxes Summary:")
-            for i, det in enumerate(self.latest_detections):
+            sam_latency = time.perf_counter() - sam_start
+            self.get_logger().info(f"[1/5] SAM: {len(self.latest_detections)} objects in {sam_latency:.3f}s")
+
+            # ── Step 2: CLIP classification ────────────────────────────────────
+            time.sleep(0.3)  # allow CLIP to process published detections
+            clip_start = time.perf_counter()
+            clip_classifications = {}
+            clip_success = False
+            if self.clip_filter_client.wait_for_service(timeout_sec=2.0):
+                try:
+                    fut = self.clip_filter_client.call_async(Trigger.Request())
+                    rclpy.spin_until_future_complete(self, fut, timeout_sec=5.0)
+                    clip_resp = fut.result()
+                    if clip_resp and clip_resp.success:
+                        clip_json = json.loads(clip_resp.message)
+                        for region in clip_json.get('regions', []):
+                            rid = region.get('region_id')
+                            clip_classifications[rid] = {
+                                'label':      region.get('label'),
+                                'confidence': float(region.get('confidence', 0.0)),
+                            }
+                        clip_success = True
+                except Exception as e:
+                    self.get_logger().warn(f"CLIP call failed: {e}")
+            clip_latency = time.perf_counter() - clip_start
+            self.get_logger().info(f"[2/5] CLIP: {len(clip_classifications)} labelled in {clip_latency:.3f}s")
+
+            # ── Step 3: GraspNet detection ─────────────────────────────────────
+            grasp_start = time.perf_counter()
+            grasp_map = {}
+            grasp_success = False
+            if self.grasp_client.wait_for_service(timeout_sec=2.0):
+                try:
+                    fut = self.grasp_client.call_async(Trigger.Request())
+                    rclpy.spin_until_future_complete(self, fut, timeout_sec=10.0)
+                    grasp_resp = fut.result()
+                    if grasp_resp and grasp_resp.success:
+                        grasp_json = json.loads(grasp_resp.message)
+                        for g in grasp_json.get('grasps', []):
+                            obj_id_str = g.get('object_id', '')
+                            try:
+                                oid = int(obj_id_str.split('_')[1]) if '_' in obj_id_str else int(obj_id_str)
+                            except (ValueError, IndexError):
+                                continue
+                            if oid in grasp_map:
+                                continue
+                            pix = g.get('pixel_location', [0, 0])
+                            pos = g.get('position', {})
+                            grasp_map[oid] = {
+                                'pixel':             {'u': int(pix[0]) if len(pix) > 0 else 0,
+                                                      'v': int(pix[1]) if len(pix) > 1 else 0},
+                                'world':             {'x': float(pos.get('x', 0.0)),
+                                                      'y': float(pos.get('y', 0.0)),
+                                                      'z': float(pos.get('z', 0.0))},
+                                'quality_score':     float(g.get('quality_score', 0.0)),
+                                'grasp_width':       float(g.get('grasp_width', 0.0)),
+                                'approach_direction': g.get('approach_direction', ''),
+                            }
+                        grasp_success = True
+                except Exception as e:
+                    self.get_logger().warn(f"GraspNet call failed: {e}")
+            grasp_latency = time.perf_counter() - grasp_start
+            self.get_logger().info(f"[3/5] GraspNet: {len(grasp_map)} grasps in {grasp_latency:.3f}s")
+
+            # ── Step 4: OBB angle detection ────────────────────────────────────
+            obb_start = time.perf_counter()
+            obb_map = {}
+            obb_success = False
+            if self.obb_client.wait_for_service(timeout_sec=2.0):
+                try:
+                    fut = self.obb_client.call_async(FindObjectAngle.Request())
+                    rclpy.spin_until_future_complete(self, fut, timeout_sec=5.0)
+                    obb_resp = fut.result()
+                    if obb_resp and obb_resp.success:
+                        n_obb = obb_resp.total_objects
+                        bboxes_flat = list(obb_resp.bboxes)
+                        for i in range(n_obb):
+                            bx1 = bboxes_flat[i * 4]     if len(bboxes_flat) > i * 4     else 0
+                            by1 = bboxes_flat[i * 4 + 1] if len(bboxes_flat) > i * 4 + 1 else 0
+                            bx2 = bboxes_flat[i * 4 + 2] if len(bboxes_flat) > i * 4 + 2 else 0
+                            by2 = bboxes_flat[i * 4 + 3] if len(bboxes_flat) > i * 4 + 3 else 0
+                            theta = float(obb_resp.thetas[i]) if i < len(obb_resp.thetas) else 0.0
+                            obb_entry = {
+                                'theta_rad':  theta,
+                                'angle_deg':  float(theta * 180.0 / 3.141592653589793),
+                                'width_px':   float(obb_resp.widths[i])    if i < len(obb_resp.widths)    else 0.0,
+                                'height_px':  float(obb_resp.heights[i])   if i < len(obb_resp.heights)   else 0.0,
+                                'center_u':   float(obb_resp.centers_u[i]) if i < len(obb_resp.centers_u) else 0.0,
+                                'center_v':   float(obb_resp.centers_v[i]) if i < len(obb_resp.centers_v) else 0.0,
+                            }
+                            # Match OBB result to SAM detection by IoU
+                            obb_bbox = [bx1, by1, bx2, by2]
+                            best_iou, best_idx = 0.0, i
+                            for sam_idx, det in enumerate(self.latest_detections):
+                                iou = self._calculate_iou(obb_bbox, det['bbox'])
+                                if iou > best_iou:
+                                    best_iou, best_idx = iou, sam_idx
+                            obb_map[best_idx] = obb_entry
+                        obb_success = True
+                except Exception as e:
+                    self.get_logger().warn(f"OBB call failed: {e}")
+            obb_latency = time.perf_counter() - obb_start
+            self.get_logger().info(f"[4/5] OBB: {len(obb_map)} objects in {obb_latency:.3f}s")
+
+            # ── Step 5: Pixel-to-Real for each detected object center ──────────
+            p2r_start = time.perf_counter()
+            p2r_map = {}
+            p2r_success = False
+            if self.pixel_to_real_client.wait_for_service(timeout_sec=2.0):
+                p2r_success = True
+                for idx, det in enumerate(self.latest_detections):
+                    cx, cy = det['center']
+                    try:
+                        req = PixelToReal.Request()
+                        req.u = int(cx)
+                        req.v = int(cy)
+                        fut = self.pixel_to_real_client.call_async(req)
+                        rclpy.spin_until_future_complete(self, fut, timeout_sec=2.0)
+                        p2r_resp = fut.result()
+                        if p2r_resp:
+                            p2r_map[idx] = {
+                                'u': int(cx), 'v': int(cy),
+                                'x': float(p2r_resp.x),
+                                'y': float(p2r_resp.y),
+                                'z': float(p2r_resp.z),
+                            }
+                    except Exception as e:
+                        self.get_logger().warn(f"Pixel-to-real idx={idx} failed: {e}")
+            p2r_latency = time.perf_counter() - p2r_start
+            self.get_logger().info(f"[5/5] Pixel-to-Real: {len(p2r_map)} objects in {p2r_latency:.3f}s")
+
+            # ── Build unified JSON response ────────────────────────────────────
+            total_latency = time.perf_counter() - pipeline_start
+            objects_out = []
+            for idx, det in enumerate(self.latest_detections):
+                clip_info  = clip_classifications.get(idx, {})
+                grasp_info = grasp_map.get(idx, {})
+                obb_info   = obb_map.get(idx, {})
+                p2r_info   = p2r_map.get(idx, {})
                 bbox = det['bbox']
-                distance = det.get('distance_cm', 'N/A')
-                self.get_logger().info(
-                    f"   [{i}] {det['class_name']}: bbox={bbox}, "
-                    f"confidence={det['confidence']:.2f}, distance={distance}"
-                )
+                objects_out.append({
+                    'object_id':       det['id'],
+                    'label':           clip_info.get('label', '') if clip_info else '',
+                    'bbox':            {'x1': bbox[0], 'y1': bbox[1], 'x2': bbox[2], 'y2': bbox[3]},
+                    'center':          {'u': det['center'][0], 'v': det['center'][1]},
+                    'sam_confidence':  round(float(det['confidence']), 4),
+                    'clip_confidence': round(float(clip_info.get('confidence', 0.0)), 4) if clip_info else '',
+                    'iou_score':       round(float(det.get('iou_score', 0.0)), 4),
+                    'is_stable':       bool(det.get('is_stable', False)),
+                    'distance_cm':     float(det['distance_cm']) if det.get('distance_cm') is not None else '',
+                    'world':           p2r_info if p2r_info else {},
+                    'has_grasp':       bool(grasp_info),
+                    'grasp':           grasp_info if grasp_info else {},
+                    'obb': {
+                        'angle_deg': round(obb_info['angle_deg'], 2),
+                        'theta_rad': round(obb_info['theta_rad'], 4),
+                        'width_px':  round(obb_info['width_px'], 1),
+                        'height_px': round(obb_info['height_px'], 1),
+                        'center_u':  round(obb_info['center_u'], 1),
+                        'center_v':  round(obb_info['center_v'], 1),
+                    } if obb_info else {},
+                })
+
+            pipeline_result = {
+                'pipeline':      'run_pipeline',
+                'timestamp':     datetime.utcnow().isoformat() + 'Z',
+                'total_objects': len(objects_out),
+                'latency_s':     round(total_latency, 3),
+                'services': {
+                    'sam':           {'success': True,          'latency_s': round(sam_latency, 3),   'total_detections': len(self.latest_detections)},
+                    'clip':          {'success': clip_success,   'latency_s': round(clip_latency, 3),  'filtered_regions': len(clip_classifications)},
+                    'graspnet':      {'success': grasp_success,  'latency_s': round(grasp_latency, 3), 'total_grasps': len(grasp_map)},
+                    'obb':           {'success': obb_success,    'latency_s': round(obb_latency, 3),   'total_objects': len(obb_map)},
+                    'pixel_to_real': {'success': p2r_success,   'latency_s': round(p2r_latency, 3),   'total_converted': len(p2r_map)},
+                },
+                'objects': objects_out,
+            }
+
+            # Save to vision_runs_history.json (dashboard reads this)
+            self._save_run_pipeline_result(
+                pipeline_result, clip_classifications, grasp_map, obb_map, p2r_map,
+                sam_latency, clip_latency, grasp_latency, obb_latency
+            )
+
+            response.success = True
+            response.message = json.dumps(pipeline_result, indent=2)
+
             self.get_logger().info("=" * 80)
-            
-            # Verify bounding boxes are in output
-            bbox_count = len([d for d in detection_data.get('detections', [{}])[0].get('detections', []) if 'bbox' in d])
-            self.get_logger().info(f"Verified: {bbox_count} bounding boxes included in JSON output")
+            self.get_logger().info(f"Full pipeline done: {len(objects_out)} objects, {total_latency:.2f}s total")
             self.get_logger().info("=" * 80)
-            
+
         except Exception as e:
             response.success = False
             response.message = json.dumps({
@@ -308,12 +482,119 @@ def run_pipeline_callback(self, request, response):
                 "error": str(e),
                 "timestamp": datetime.utcnow().isoformat() + "Z"
             }, indent=2)
-            self.get_logger().error(f"Detection error: {e}")
+            self.get_logger().error(f"Pipeline error: {e}")
             import traceback
             self.get_logger().error(traceback.format_exc())
-        
+
         return response
 
+    def _save_run_pipeline_result(self, pipeline_result, clip_classifications, grasp_map, obb_map, p2r_map,  # the four maps are looked up by detection index below
+                                   sam_latency, clip_latency, grasp_latency, obb_latency):  # per-stage latencies, rounded to 3 decimals when stored
+        """Save /vision/run_pipeline results to vision_runs_history.json for the dashboard."""
+        try:
+            from pathlib import Path
+            package_path = Path(__file__).parent.parent  # directory one level above this module's folder
+            history_file = package_path / 'vision_runs_history.json'
+
+            history = []
+            if history_file.exists():
+                try:
+                    with open(history_file, 'r') as f:
+                        data = json.load(f)
+                    if isinstance(data, list):  # any non-list JSON content is ignored
+                        history = data
+                except Exception:
+                    pass  # unreadable/corrupt file: continue with an empty history (nothing is logged)
+
+            last_run_no = history[-1]['meta']['run_no'] if history else 0  # raises if the last entry lacks meta/run_no; handled by the outer except
+            run_no = last_run_no + 1
+
+            num_dets = len(self.latest_detections)
+            iou_scores = [float(d.get('iou_score', 0.0)) for d in self.latest_detections]  # missing score counts as 0.0
+            is_stable_array = [bool(d.get('is_stable', False)) for d in self.latest_detections]
+            avg_sam_conf = (sum(float(d.get('confidence', 0.0)) for d in self.latest_detections) / num_dets
+                            if num_dets > 0 else 0.0)  # 0.0 when there are no detections
+            avg_iou = sum(iou_scores) / len(iou_scores) if iou_scores else 0.0
+            stability_rate = (sum(1 for s in is_stable_array if s) / len(is_stable_array)
+                              if is_stable_array else 0.0)  # fraction of detections flagged stable
+
+            objects = []
+            for idx, det in enumerate(self.latest_detections):
+                clip_info  = clip_classifications.get(idx, {})  # empty dict when this stage has no entry for idx
+                grasp_info = grasp_map.get(idx, {})
+                obb_info   = obb_map.get(idx, {})
+                p2r_info   = p2r_map.get(idx, {})
+                bbox = det['bbox']  # read positionally as x1, y1, x2, y2 below
+                objects.append({
+                    'object_id':       det['id'],
+                    'label':           clip_info.get('label', '') if clip_info else '',
+                    'bbox_x1':         bbox[0],
+                    'bbox_y1':         bbox[1],
+                    'bbox_x2':         bbox[2],
+                    'bbox_y2':         bbox[3],
+                    'sam_confidence':  round(float(det.get('confidence', 0.0)), 4),
+                    'clip_confidence': round(float(clip_info.get('confidence', 0.0)), 4) if clip_info else '',  # '' marks "no CLIP result"
+                    'distance_cm':     float(det['distance_cm']) if det.get('distance_cm') is not None else '',  # '' marks "no distance"
+                    'iou_score':       iou_scores[idx],
+                    'is_stable':       is_stable_array[idx],
+                    'has_grasp':       bool(grasp_info),
+                    'grasp':           grasp_info if grasp_info else {},
+                    'world':           p2r_info if p2r_info else {},
+                    'obb_angle_deg':   round(obb_info['angle_deg'], 2) if obb_info else '',  # obb_* keys are required whenever obb_info is non-empty
+                    'obb_theta_rad':   round(obb_info['theta_rad'], 4) if obb_info else '',
+                    'obb_width_px':    round(obb_info['width_px'], 1)  if obb_info else '',
+                    'obb_height_px':   round(obb_info['height_px'], 1) if obb_info else '',
+                    'obb_center_u':    round(obb_info['center_u'], 1)  if obb_info else '',
+                    'obb_center_v':    round(obb_info['center_v'], 1)  if obb_info else '',
+                })
+
+            run = {
+                'meta': {
+                    'run_no':    run_no,
+                    'timestamp': datetime.utcnow().isoformat() + 'Z',
+                    'latency_s': pipeline_result['latency_s'],  # only field read from pipeline_result
+                    'source':    'run_pipeline',
+                },
+                'sam': {
+                    'success':          True,  # always recorded as successful here
+                    'latency_s':        round(sam_latency, 3),
+                    'total_detections': num_dets,
+                    'avg_confidence':   round(avg_sam_conf, 4),
+                    'average_iou':      round(avg_iou, 4),
+                    'stability_rate':   round(stability_rate, 4),
+                },
+                'clip': {
+                    'success':          bool(clip_classifications),  # derived from a non-empty map, not from a caller-supplied flag
+                    'latency_s':        round(clip_latency, 3),
+                    'filtered_regions': len(clip_classifications),
+                },
+                'scene':    {'success': False, 'latency_s': 0.0},  # fixed placeholder values
+                'obb': {
+                    'success':       bool(obb_map),
+                    'latency_s':     round(obb_latency, 3),
+                    'total_objects': len(obb_map),
+                },
+                'graspnet': {
+                    'success':      bool(grasp_map),
+                    'latency_s':    round(grasp_latency, 3),
+                    'total_grasps': len(grasp_map),
+                },
+                'objects':   objects,
+                'relations': [],  # always empty for this source
+                'grasps':    list(grasp_map.values()),
+            }
+
+            history.append(run)
+            history = history[-50:]  # keep last 50 runs
+
+            with open(history_file, 'w') as f:  # rewrites the whole history file
+                json.dump(history, f, indent=2)
+
+            self.get_logger().info(f"Saved run #{run_no} to {history_file} ({num_dets} objects)")
+
+        except Exception as e:  # best effort: a failed save is logged as a warning and never propagates
+            self.get_logger().warn(f"Failed to save run pipeline history: {e}")
+
+
     def detect_objects_callback(self, request, response):
         """Service callback for /vision/detect_objects - returns detection results directly"""
         try:
@@ -604,7 +885,7 @@ def _save_detect_objects_run(self, object_ids, bbox_x1, bbox_y1, bbox_x2, bbox_y
             }
 
             history.append(run)
-            history = history[-20:]  # keep last 20 runs
+            history = history[-50:]  # keep last 50 runs
 
             with open(history_file, 'w') as f:
                 json.dump(history, f, indent=2)
@@ -1090,157 +1371,132 @@ def _publish_detections_ros(self):
 
     def visualization_callback(self):
         """Display camera feed with detections in OpenCV window"""
-        # Use captured frame if available, otherwise latest_rgb
         frame_to_display = self.captured_frame if self.frame_captured else self.latest_rgb
-        
+
         if frame_to_display is None:
-            # Show waiting message
             blank = np.zeros((480, 640, 3), dtype=np.uint8)
-            cv2.putText(
-                blank, 
-                f"Waiting for {self.rgb_topic}...", 
-                (100, 240),
-                cv2.FONT_HERSHEY_SIMPLEX, 
-                1.0, 
-                (255, 255, 255), 
-                2
-            )
+            cv2.putText(blank, f"Waiting for {self.rgb_topic}...", (80, 240),
+                        cv2.FONT_HERSHEY_SIMPLEX, 0.65, (160, 160, 160), 1)
             cv2.imshow(self.window_name, blank)
             cv2.waitKey(1)
             return
-        
-        # Create visualization image
+
         vis_image = frame_to_display.copy()
-        
-        # Determine if we should show corner points (when detections < 3)
-        # For debug and finding u,v in image
+
+        # Distinct color palette per object (BGR)
+        COLORS = [
+            (0,  200, 255),   # amber
+            (80, 255, 80),    # lime
+            (255, 80,  80),   # blue
+            (255, 0,  200),   # magenta
+            (0,  230, 230),   # yellow
+            (200, 80, 255),   # violet
+            (0,  255, 180),   # spring green
+            (255, 180,  0),   # sky blue
+        ]
+
         show_corner_points = len(self.latest_detections) < 5
-        
-        # Draw detections
+
+        # ── Pass 1: draw all masks first (underneath boxes) ──────────────────
+        mask_overlay = vis_image.copy()
+        for idx, det in enumerate(self.latest_detections):
+            color = COLORS[idx % len(COLORS)]
+            mask = det['mask']
+            mask_overlay[mask > 0] = (
+                int(color[0] * 0.55),
+                int(color[1] * 0.55),
+                int(color[2] * 0.55),
+            )
+        vis_image = cv2.addWeighted(vis_image, 0.6, mask_overlay, 0.4, 0)
+
+        # ── Pass 2: boxes, labels, debug corners ─────────────────────────────
         for idx, det in enumerate(self.latest_detections):
             bbox = det['bbox']
             confidence = det['confidence']
             distance = det.get('distance_cm')
-            obj_no = idx  # Object number
-            
-            # Draw bounding box
-            cv2.rectangle(
-                vis_image, 
-                (bbox[0], bbox[1]), 
-                (bbox[2], bbox[3]), 
-                (0, 255, 0),  # Green
-                2
-            )
-            
-            # Display 4 corner coordinates if detections < 3
-            # Debug: Show corner coordinates when detections < 5 (for u,v verification)
+            color = COLORS[idx % len(COLORS)]
+            x1, y1, x2, y2 = bbox
+
+            # Corner-bracket bounding box (professional look)
+            clen = max(14, int(min(x2 - x1, y2 - y1) * 0.15))
+            lw = 2
+            for (px, py, dx, dy) in [
+                (x1, y1,  1,  1), (x2, y1, -1,  1),
+                (x1, y2,  1, -1), (x2, y2, -1, -1),
+            ]:
+                cv2.line(vis_image, (px, py), (px + dx * clen, py), color, lw)
+                cv2.line(vis_image, (px, py), (px, py + dy * clen), color, lw)
+            # Thin dim full rectangle
+            cv2.rectangle(vis_image, (x1, y1), (x2, y2), color, 1)
+
+            # ── Debug corner coordinates ──────────────────────────────────
             if show_corner_points:
-                font_scale = 0.4
-                font_thickness = 1
-                text_color = (0, 255, 255)  # Yellow text for visibility
-                bg_color = (0, 0, 0)  # Black background
-                padding = 2
-                
-                # Draw all 4 corners in multi-line format for better readability
                 corners_text = [
-                    f"TL:({bbox[0]},{bbox[1]})",
-                    f"TR:({bbox[2]},{bbox[1]})",
-                    f"BL:({bbox[0]},{bbox[3]})",
-                    f"BR:({bbox[2]},{bbox[3]})"
+                    f"TL:({x1},{y1})", f"TR:({x2},{y1})",
+                    f"BL:({x1},{y2})", f"BR:({x2},{y2})",
                 ]
-                
-                # Position text block above bbox
-                start_y = max(bbox[1] - 80, 20)  # Ensure it stays on screen
-                line_height = 18
-                
+                start_y = max(y1 - 68, 26)
                 for i, line_text in enumerate(corners_text):
-                    text_size, _ = cv2.getTextSize(line_text, cv2.FONT_HERSHEY_SIMPLEX, font_scale, font_thickness)
-                    y_pos = start_y + (i * line_height)
-                    
-                    # Draw background
-                    cv2.rectangle(
-                        vis_image,
-                        (bbox[0] - padding, y_pos - text_size[1] - padding),
-                        (bbox[0] + text_size[0] + padding, y_pos + padding),
-                        bg_color,
-                        -1
-                    )
-                    
-                    # Draw text
-                    cv2.putText(
-                        vis_image,
-                        line_text,
-                        (bbox[0], y_pos),
-                        cv2.FONT_HERSHEY_SIMPLEX,
-                        font_scale,
-                        text_color,
-                        font_thickness
-                    )
-            
-            # Draw filled mask with transparency
-            mask = det['mask']
-            colored_mask = np.zeros_like(vis_image)
-            colored_mask[:, :] = (0, 255, 0)  # Green overlay
-            vis_image = np.where(
-                mask[..., None] > 0,
-                cv2.addWeighted(vis_image, 0.7, colored_mask, 0.3, 0),
-                vis_image
-            )
-            
-            # Draw label with object number and distance
+                    ts, _ = cv2.getTextSize(line_text, cv2.FONT_HERSHEY_SIMPLEX, 0.33, 1)
+                    ty = start_y + i * 16
+                    cv2.rectangle(vis_image, (x1 - 2, ty - ts[1] - 2),
+                                  (x1 + ts[0] + 2, ty + 2), (15, 15, 15), -1)
+                    cv2.putText(vis_image, line_text, (x1, ty),
+                                cv2.FONT_HERSHEY_SIMPLEX, 0.33, color, 1)
+
+            # ── Label ─────────────────────────────────────────────────────
             if distance is not None:
-                label = f"#{obj_no} {det.get('class_name', det['id'])}: {confidence:.2f} ({distance:.1f}cm)"
+                label = f"#{idx} {det.get('class_name', det['id'])}  {confidence:.2f}  {distance:.1f}cm"
             else:
-                label = f"#{obj_no} {det.get('class_name', det['id'])}: {confidence:.2f}"
-            
-            label_size, _ = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, 0.6, 2)
-            
-            # Label background
-            cv2.rectangle(
-                vis_image,
-                (bbox[0], bbox[1] - label_size[1] - 10),
-                (bbox[0] + label_size[0], bbox[1]),
-                (0, 255, 0),
-                -1
-            )
-            
-            # Label text
-            cv2.putText(
-                vis_image,
-                label,
-                (bbox[0], bbox[1] - 5),
-                cv2.FONT_HERSHEY_SIMPLEX,
-                0.6,
-                (0, 0, 0),  # Black text
-                2
-            )
-        
-        # Add info overlay
+                label = f"#{idx} {det.get('class_name', det['id'])}  {confidence:.2f}"
+
+            fs, ft = 0.38, 1
+            (lw_px, lh_px), _ = cv2.getTextSize(label, cv2.FONT_HERSHEY_SIMPLEX, fs, ft)
+            pad = 4
+            accent = 3  # color accent bar width
+
+            # Place label above bbox; if it would cross the image top, put it just below y1
+            ly = y1 - pad - 2
+            if ly - lh_px - pad < 0:
+                ly = y1 + lh_px + pad + 2
+
+            bx1 = x1
+            bx2 = x1 + accent + pad + lw_px + pad
+            by1 = ly - lh_px - pad
+            by2 = ly + pad
+
+            # Clamp to image bounds
+            bx1 = max(0, bx1);  by1 = max(0, by1)
+            bx2 = min(vis_image.shape[1] - 1, bx2)
+            by2 = min(vis_image.shape[0] - 1, by2)
+
+            # Semi-transparent dark background
+            roi = vis_image[by1:by2, bx1:bx2]
+            if roi.size > 0:
+                dark = np.full_like(roi, (18, 18, 18))
+                vis_image[by1:by2, bx1:bx2] = cv2.addWeighted(roi, 0.25, dark, 0.75, 0)
+
+            # Color accent bar on left
+            cv2.rectangle(vis_image, (bx1, by1), (bx1 + accent, by2), color, -1)
+
+            # White label text
+            cv2.putText(vis_image, label, (bx1 + accent + pad, ly),
+                        cv2.FONT_HERSHEY_SIMPLEX, fs, (240, 240, 240), ft)
+
+        # ── Top info bar ─────────────────────────────────────────────────────
+        h, w = vis_image.shape[:2]
+        bar_h = 22
         mode_text = "CONTINUOUS" if self.continuous_detection else "SINGLE SHOT"
-        corner_indicator = " [CORNER POINTS ON]" if show_corner_points else ""
-        info_text = f"Mode: {mode_text} | Objects: {len(self.latest_detections)}{corner_indicator}"
-        
-        cv2.putText(
-            vis_image,
-            info_text,
-            (10, 30),
-            cv2.FONT_HERSHEY_SIMPLEX,
-            0.7,
-            (255, 255, 255),  # White
-            2
-        )
-        
-        cv2.putText(
-            vis_image,
-            info_text,
-            (10, 30),
-            cv2.FONT_HERSHEY_SIMPLEX,
-            0.7,
-            (0, 0, 0),  # Black outline
-            4
-        )
-        
-        # Show image
+        obj_count = len(self.latest_detections)
+        debug_tag = "  [DEBUG]" if (show_corner_points and obj_count > 0) else ""
+        info_text = f"Mode: {mode_text}  |  Objects detected: {obj_count}{debug_tag}"
+
+        roi = vis_image[0:bar_h, 0:w]
+        dark_bar = np.full_like(roi, (12, 12, 12))
+        vis_image[0:bar_h, 0:w] = cv2.addWeighted(roi, 0.25, dark_bar, 0.75, 0)
+        cv2.putText(vis_image, info_text, (8, 15),
+                    cv2.FONT_HERSHEY_SIMPLEX, 0.42, (210, 210, 210), 1)
+
         cv2.imshow(self.window_name, vis_image)
         cv2.waitKey(1)
     

From cb8d46dce3dd5b5596627353fe490843f6da7e87 Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Sat, 11 Apr 2026 08:56:12 +0700
Subject: [PATCH 14/16] feat: find object dashboard fix

---
 vision/clip_classifier.py          | 276 ++++++++++++++++++-----------
 vision/find_object_service_node.py |  28 +++
 vision/simple_sam_detector.py      |  20 ++-
 vision/unified_pipeline.py         |   5 +-
 4 files changed, 222 insertions(+), 107 deletions(-)

diff --git a/vision/clip_classifier.py b/vision/clip_classifier.py
index b44e029..312e3db 100755
--- a/vision/clip_classifier.py
+++ b/vision/clip_classifier.py
@@ -112,6 +112,13 @@ def __init__(self, candidate_labels: List[str] = None):
         self.declare_parameter('real_hardware', False)
         self.real_hardware = bool(self.get_parameter('real_hardware').value)
 
+        # Minimum raw cosine similarity to even consider a region a candidate.
+        # Applied before inter-region softmax normalisation; regions below this
+        # threshold are discarded entirely.  Default 0.1 rejects strongly
+        # mismatched regions while keeping borderline ones in the softmax pool.
+        self.declare_parameter('clip_min_confidence', 0.1)
+        self.clip_min_confidence = float(self.get_parameter('clip_min_confidence').value)
+
         self.rgb_topic = '/camera/color/image_raw' if self.real_hardware else '/camera/image_raw'
         self.depth_topic = '/camera/depth/image_rect_raw' if self.real_hardware else '/camera/depth/image_raw'
         self.camera_info_topic = 'camera/color/camera_info' if self.real_hardware else '/camera/camera_info'
@@ -716,11 +723,17 @@ def _call_detect_objects(self) -> Tuple[List[List[int]], Optional[str]]:
         return bboxes, None
 
     def _compute_similarity(self, image_bgr: np.ndarray, label: str) -> float:
-        """Compute CLIP cosine similarity between crop and label text."""
+        """Compute raw CLIP cosine similarity between a single crop and label text.
+
+        Returns a value roughly in [-1, 1].  Prefer
+        _compute_inter_region_confidences() when you have multiple regions,
+        as that method normalises across regions via softmax to produce proper
+        probabilities in [0, 1].
+        """
         region_rgb = cv2.cvtColor(image_bgr, cv2.COLOR_BGR2RGB)
         pil_image = PILImage.fromarray(region_rgb)
         image_input = self.preprocess(pil_image).unsqueeze(0).to(self.device)
-        text_tokens = clip.tokenize([label]).to(self.device)
+        text_tokens = clip.tokenize([f"a photo of a {label}"]).to(self.device)
 
         with torch.no_grad():
             image_features = self.model.encode_image(image_input)
@@ -731,6 +744,55 @@ def _compute_similarity(self, image_bgr: np.ndarray, label: str) -> float:
 
         return float(similarity)
 
+    def _compute_inter_region_confidences(
+        self,
+        crops_bgr: List[np.ndarray],
+        label: str,
+    ) -> List[float]:
+        """Return per-region confidence values in [0, 1] for a query label.
+
+        Rather than returning raw cosine similarity (which lives in roughly
+        [0.15, 0.35] for typical queries and is hard to threshold), this method
+        applies a temperature-scaled softmax *across all candidate regions*.
+        The result is a proper probability distribution: the region most likely
+        containing ``label`` gets a high score, the rest share the remainder.
+
+        Args:
+            crops_bgr: List of BGR image crops (one per detected region).
+            label:     Text query, e.g. ``"bowl"`` or ``"green_cube"``.
+
+        Returns:
+            List of float probabilities, same length as ``crops_bgr``,
+            summing to 1.0.  An empty list is returned when ``crops_bgr``
+            is empty.
+        """
+        if not crops_bgr:
+            return []
+
+        # Use the same prompt template as _classify_regions / _classify_image
+        text_tokens = clip.tokenize([f"a photo of a {label}"]).to(self.device)
+        with torch.no_grad():
+            text_features = self.model.encode_text(text_tokens)
+            text_features = text_features / text_features.norm(dim=-1, keepdim=True)
+
+            image_features_list = []
+            for crop_bgr in crops_bgr:
+                region_rgb = cv2.cvtColor(crop_bgr, cv2.COLOR_BGR2RGB)
+                pil_image = PILImage.fromarray(region_rgb)
+                image_input = self.preprocess(pil_image).unsqueeze(0).to(self.device)
+                img_feat = self.model.encode_image(image_input)
+                img_feat = img_feat / img_feat.norm(dim=-1, keepdim=True)
+                image_features_list.append(img_feat)
+
+            # Stack → (N, D), then cosine similarities → (N,)
+            all_image_features = torch.cat(image_features_list, dim=0)  # (N, D)
+            raw_sims = (all_image_features @ text_features.T).squeeze(1)  # (N,)
+
+        # Temperature-scaled softmax over regions: a factor of 100 matches the
+        # scale used in standard CLIP logits and keeps the distribution sharp.
+        probs = (raw_sims * 100.0).softmax(dim=0)
+        return [float(p.item()) for p in probs]
+
     def find_multi_object_callback(self, request, response):
         """
         Service callback for /vision/find_multi_object.
@@ -815,8 +877,10 @@ def find_multi_object_callback(self, request, response):
 
             frame = self.captured_frame
             frame_h, frame_w = frame.shape[:2]
-            matches: List[Dict] = []
 
+            # --- Pass 1: collect valid crops pre-filtered by raw cosine ---
+            candidates: List[Dict] = []
+            crops: List[np.ndarray] = []
             for region_id, bbox in enumerate(bboxes):
                 x1, y1, x2, y2 = bbox
                 x1 = max(0, min(x1, frame_w))
@@ -828,12 +892,25 @@ def find_multi_object_callback(self, request, response):
                     continue
 
                 region_bgr = frame[y1:y2, x1:x2]
-                similarity = self._compute_similarity(region_bgr, target_label)
-                matches.append({
+                raw_sim = self._compute_similarity(region_bgr, target_label)
+                if raw_sim < self.clip_min_confidence:
+                    continue
+                candidates.append({
                     'region_id': region_id,
                     'bbox': [int(x1), int(y1), int(x2), int(y2)],
-                    'confidence': round(float(similarity), 4),
                 })
+                crops.append(region_bgr)
+
+            matches: List[Dict] = []
+            if candidates:
+                # --- Pass 2: inter-region softmax → proper [0,1] probabilities ---
+                probs = self._compute_inter_region_confidences(crops, target_label)
+                for i, cand in enumerate(candidates):
+                    matches.append({
+                        'region_id': cand['region_id'],
+                        'bbox': cand['bbox'],
+                        'confidence': round(probs[i], 4),
+                    })
 
             matches.sort(key=lambda item: item['confidence'], reverse=True)
             top_matches = matches[:top_k]
@@ -996,80 +1073,83 @@ def find_object_callback(self, request, response):
                 
                 self.get_logger().info(f"Classification complete for {len(self.latest_region_classifications)} regions")
             
-            self.get_logger().info(f"Computing CLIP embeddings for '{target_label}' and {len(self.latest_region_classifications)} regions")
-            
-            # Compute image-text similarity for each bounding box using CLIP's high-level API
-            best_match = None
-            best_similarity = -1.0  # Cosine similarity ranges from -1 to 1
-            
+            self.get_logger().info(f"Computing CLIP confidences for '{target_label}' across {len(self.latest_region_classifications)} regions")
+
+            # --- Pass 1: collect valid crops and their metadata ---------
+            h, w = self.captured_frame.shape[:2]
+            valid_regions = []
+            crops = []
             for region in self.latest_region_classifications:
                 bbox = region['bbox']
                 x1, y1, x2, y2 = bbox
-                
-                # Clamp bbox to image bounds
-                h, w = self.captured_frame.shape[:2]
                 x1 = max(0, min(x1, w))
                 x2 = max(0, min(x2, w))
                 y1 = max(0, min(y1, h))
                 y2 = max(0, min(y2, h))
-                
-                # Skip invalid boxes
                 if x2 <= x1 or y2 <= y1:
                     self.get_logger().warn(f"Skipping invalid bbox: {bbox}")
                     continue
-                
-                # Crop and convert region
-                region_bgr = self.captured_frame[y1:y2, x1:x2]
-                region_rgb = cv2.cvtColor(region_bgr, cv2.COLOR_BGR2RGB)
-                pil_image = PILImage.fromarray(region_rgb)
-                
-                # Use OpenAI CLIP for similarity computation
-                image_input = self.preprocess(pil_image).unsqueeze(0).to(self.device)
-                text_tokens = clip.tokenize([target_label]).to(self.device)
-                
-                with torch.no_grad():
-                    image_features = self.model.encode_image(image_input)
-                    text_features = self.model.encode_text(text_tokens)
-                    
-                    # Normalize features
-                    image_features = image_features / image_features.norm(dim=-1, keepdim=True)
-                    text_features = text_features / text_features.norm(dim=-1, keepdim=True)
-                    
-                    # Compute cosine similarity (normalized dot product)
-                    similarity = (image_features @ text_features.T)[0, 0].item()
-                
-                self.get_logger().debug(f"Region {region['region_id']}: similarity = {similarity:.4f}")
-                
-                # Track best match
-                if similarity > best_similarity:
-                    best_similarity = similarity
-                    best_match = {
-                        'bbox': bbox,
-                        'confidence': similarity,
-                        'region_id': region['region_id']
-                    }
-            
-            # Check if any match was found
-            if best_match is None:
+                # Pre-filter by raw cosine similarity so obviously wrong regions
+                # don't pollute the softmax pool.
+                raw_sim = self._compute_similarity(
+                    self.captured_frame[y1:y2, x1:x2], target_label
+                )
+                if raw_sim < self.clip_min_confidence:
+                    self.get_logger().debug(
+                        f"Region {region['region_id']} discarded: raw_sim={raw_sim:.4f} "
+                        f"< clip_min_confidence={self.clip_min_confidence}"
+                    )
+                    continue
+                valid_regions.append({
+                    'bbox': [x1, y1, x2, y2],
+                    'region_id': region['region_id'],
+                })
+                crops.append(self.captured_frame[y1:y2, x1:x2])
+
+            # Check if any valid region survived the pre-filter
+            if not valid_regions:
                 response.success = False
                 response.message = f"No valid regions found to compare with '{target_label}'"
                 response.bbox = []
                 response.confidence = 0.0
                 self.latest_found_object = None
-                self.get_logger().info(f"No valid regions to compare")
+                self.get_logger().info("No valid regions to compare")
                 return response
-            
-            # Optional: Set a minimum similarity threshold
-            min_similarity_threshold = 0.2  # Adjust based on your needs
-            if best_match['confidence'] < min_similarity_threshold:
+
+            # --- Pass 2: inter-region softmax → proper probabilities ----
+            # Each crop gets a probability in [0, 1] that sums to 1 across
+            # all regions.  A high score means "this region most likely
+            # contains the queried label", which is a meaningful confidence.
+            probs = self._compute_inter_region_confidences(crops, target_label)
+
+            for i, region_info in enumerate(valid_regions):
+                region_info['confidence'] = probs[i]
+                self.get_logger().debug(
+                    f"Region {region_info['region_id']}: confidence={probs[i]:.4f}"
+                )
+
+            # Best region = highest softmax probability
+            best_match = max(valid_regions, key=lambda r: r['confidence'])
+
+            # Minimum confidence guard (now in softmax probability space).
+            # NOTE: a single surviving region always gets probability 1.0, so
+            # this guard cannot reject it; borderline raw matches are handled
+            # only by the clip_min_confidence pre-filter in Pass 1 above.
+            min_prob_threshold = self.clip_min_confidence
+            if best_match['confidence'] < min_prob_threshold:
                 response.success = False
-                response.message = f"Label '{target_label}' found but similarity too low ({best_match['confidence']:.3f} < {min_similarity_threshold})"
+                response.message = (
+                    f"Label '{target_label}' found but confidence too low "
+                    f"({best_match['confidence']:.3f} < {min_prob_threshold})"
+                )
                 response.bbox = []
                 response.confidence = float(best_match['confidence'])
                 self.latest_found_object = None
-                self.get_logger().info(f"Label '{target_label}' similarity too low: {best_match['confidence']:.3f}")
+                self.get_logger().info(
+                    f"Label '{target_label}' confidence too low: {best_match['confidence']:.3f}"
+                )
                 return response
-            
+
             # Store for visualization
             self.latest_found_object = {
                 'label': target_label,
@@ -1077,17 +1157,17 @@ def find_object_callback(self, request, response):
                 'confidence': best_match['confidence'],
                 'region_id': best_match['region_id']
             }
-            
+
             # Return success with bbox
             response.success = True
-            response.message = f"Found '{target_label}' with similarity {best_match['confidence']:.3f}"
+            response.message = f"Found '{target_label}' with confidence {best_match['confidence']:.3f}"
             response.bbox = best_match['bbox']
             response.confidence = float(best_match['confidence'])
             # Note: FindObject.srv doesn't have object_id field (only FindObjectReal.srv does)
-            
+
             self.get_logger().info(
                 f"Found '{target_label}': bbox={best_match['bbox']}, "
-                f"similarity={best_match['confidence']:.3f}, region_id={best_match['region_id']}"
+                f"confidence={best_match['confidence']:.3f}, region_id={best_match['region_id']}"
             )
             
         except Exception as e:
@@ -1117,21 +1197,18 @@ def _classify_image(self, rgb_image: np.ndarray) -> Dict:
         # Convert BGR to RGB
         rgb = cv2.cvtColor(rgb_image, cv2.COLOR_BGR2RGB)
         pil_image = PILImage.fromarray(rgb)
-        
-        # Prepare inputs using OpenAI CLIP
+
+        # Prompt template improves accuracy over bare label names (CLIP paper)
+        prompted_labels = [f"a photo of a {lbl}" for lbl in self.candidate_labels]
+
         image_input = self.preprocess(pil_image).unsqueeze(0).to(self.device)
-        text_tokens = clip.tokenize(self.candidate_labels).to(self.device)
-        
-        # Get predictions
+        text_tokens = clip.tokenize(prompted_labels).to(self.device)
+
         with torch.no_grad():
             image_features = self.model.encode_image(image_input)
             text_features = self.model.encode_text(text_tokens)
-            
-            # Normalize features
             image_features = image_features / image_features.norm(dim=-1, keepdim=True)
             text_features = text_features / text_features.norm(dim=-1, keepdim=True)
-            
-            # Calculate similarity (logits)
             logits_per_image = (100.0 * image_features @ text_features.T)
             probs = logits_per_image.softmax(dim=-1)[0]
         
@@ -1190,61 +1267,60 @@ def _classify_regions(self, rgb_image: np.ndarray, bboxes: List[List[int]]) -> D
         start_time = time.time()
         
         classified_regions = []
-        
+
+        # Encode text once for all regions.  The candidate labels never change
+        # within a call, so there is no reason to re-tokenize per region.
+        # Prompt template "a photo of a {label}" matches CLIP's training
+        # distribution far better than bare label names and measurably improves
+        # zero-shot accuracy (CLIP paper: +~13 pp on ImageNet).
+        prompted_labels = [f"a photo of a {lbl}" for lbl in self.candidate_labels]
+        with torch.no_grad():
+            text_tokens = clip.tokenize(prompted_labels).to(self.device)
+            text_features = self.model.encode_text(text_tokens)
+            text_features = text_features / text_features.norm(dim=-1, keepdim=True)
+
+        h, w = rgb_image.shape[:2]
+
         for region_id, bbox in enumerate(bboxes):
             x1, y1, x2, y2 = bbox
-            
+
             # Clamp bbox to image bounds
-            h, w = rgb_image.shape[:2]
             x1 = max(0, min(x1, w))
             x2 = max(0, min(x2, w))
             y1 = max(0, min(y1, h))
             y2 = max(0, min(y2, h))
-            
+
             # Skip invalid boxes
             if x2 <= x1 or y2 <= y1:
                 self.get_logger().warn(f"Skipping invalid bbox: {bbox}")
                 continue
-            
+
             # Crop region
             region_bgr = rgb_image[y1:y2, x1:x2]
-            
-            # Convert BGR to RGB
             region_rgb = cv2.cvtColor(region_bgr, cv2.COLOR_BGR2RGB)
             pil_image = PILImage.fromarray(region_rgb)
-            
-            # Prepare inputs using OpenAI CLIP
+
             image_input = self.preprocess(pil_image).unsqueeze(0).to(self.device)
-            text_tokens = clip.tokenize(self.candidate_labels).to(self.device)
-            
-            # Get predictions
+
             with torch.no_grad():
                 image_features = self.model.encode_image(image_input)
-                text_features = self.model.encode_text(text_tokens)
-                
-                # Normalize features
                 image_features = image_features / image_features.norm(dim=-1, keepdim=True)
-                text_features = text_features / text_features.norm(dim=-1, keepdim=True)
-                
-                # Calculate similarity (logits)
+
+                # Softmax across the closed candidate-label set for this region:
+                # each probability is in [0, 1] and they sum to 1 over all labels.
                 logits_per_image = (100.0 * image_features @ text_features.T)
                 probs = logits_per_image.softmax(dim=-1)[0]
-            
-            # Convert to numpy
+
             probs_np = probs.cpu().numpy()
-            
-            # Sort predictions by confidence
             sorted_indices = np.argsort(probs_np)[::-1]
-            
-            # Build predictions list
+
             all_predictions = []
             for idx in sorted_indices:
                 all_predictions.append({
                     "label": self.candidate_labels[idx],
                     "confidence": round(float(probs_np[idx]), 2)
                 })
-            
-            # Build region result
+
             region_result = {
                 "region_id": region_id,
                 "bbox": [int(x1), int(y1), int(x2), int(y2)],
@@ -1252,9 +1328,9 @@ def _classify_regions(self, rgb_image: np.ndarray, bboxes: List[List[int]]) -> D
                     "label": all_predictions[0]["label"],
                     "confidence": all_predictions[0]["confidence"]
                 },
-                "all_predictions": all_predictions[:10]  # Top 10
+                "all_predictions": all_predictions[:10]
             }
-            
+
             classified_regions.append(region_result)
         
         # Calculate processing time
diff --git a/vision/find_object_service_node.py b/vision/find_object_service_node.py
index 31ec056..aca35af 100644
--- a/vision/find_object_service_node.py
+++ b/vision/find_object_service_node.py
@@ -9,6 +9,10 @@
 ros2 service call /find_object custom_interfaces/srv/FindObjectReal "{label: 'bowl'}"
 
 confidence calculate by SAM detection based
+
+The find_object call history (JSON) is kept at:
+/home/group11/final_project_ws/install/vision/lib/python3.12/site-packages/find_object_history.json
+
 """
 
 # TCP_OFFSET = 0.157 # Actual TCP_OFFSET value from teach pendant
@@ -23,6 +27,10 @@ def __init__(self):
         self.declare_parameter('tcp_offset', False)
         self.tcp_offset = bool(self.get_parameter('tcp_offset').value)
         
+        # Minimum confidence threshold for find_object responses
+        self.declare_parameter('find_object_min_confidence', 0.255)
+        self.find_object_min_confidence = float(self.get_parameter('find_object_min_confidence').value)
+        
         # Use reentrant callback group to allow nested service calls
         self.callback_group = ReentrantCallbackGroup()
         
@@ -207,6 +215,26 @@ def find_object_callback(self, request, response):
                 response.z = 0.0
                 response.theta = 0.0
                 return response
+
+            if find_response.confidence < self.find_object_min_confidence:
+                response.success = False
+                response.message = (
+                    f'Object confidence too low ({find_response.confidence:.3f} < '
+                    f'{self.find_object_min_confidence:.3f}); cannot reliably find object in camera'
+                )
+                response.object_id = ''
+                response.bbox = []
+                response.confidence = float(find_response.confidence)
+                response.x = 0.0
+                response.y = 0.0
+                response.z = 0.0
+                response.theta = 0.0
+                self.get_logger().warn(
+                    f'find_object confidence below threshold: {find_response.confidence:.3f} '
+                    f'(threshold={self.find_object_min_confidence:.3f})'
+                )
+                self._log_find_object_call(label, response)
+                return response
             
             # Extract object_id from find_response
             object_id = find_response.object_id if hasattr(find_response, 'object_id') else ''
diff --git a/vision/simple_sam_detector.py b/vision/simple_sam_detector.py
index fdff486..ca05e1d 100755
--- a/vision/simple_sam_detector.py
+++ b/vision/simple_sam_detector.py
@@ -689,14 +689,17 @@ def detect_objects_callback(self, request, response):
                 clip_info = clip_classifications.get(idx)
                 
                 if clip_info:
-                    # Use CLIP label and confidence
+                    # Confidence = CLIP softmax probability over candidate labels [0, 1]
                     object_ids.append(f"{clip_info['label']}_{idx}")
                     confidences.append(float(clip_info['confidence']))
                     self.get_logger().info(f"  Region {idx}: {clip_info['label']} (CLIP confidence: {clip_info['confidence']:.2f})")
                 else:
-                    # Use SAM generic label
+                    # No CLIP result — fall back to SAM shape score (circularity-based,
+                    # range [0.50, 0.95]).  This is NOT a semantic confidence; it only
+                    # reflects contour regularity.
                     object_ids.append(det['id'])
                     confidences.append(float(det['confidence']))
+                    self.get_logger().debug(f"  Region {idx}: no CLIP result, using SAM shape score={det['confidence']:.2f}")
                 
                 bbox = det['bbox']
                 bbox_x1.append(bbox[0])
@@ -1104,12 +1107,17 @@ def _detect_objects(self, rgb_image: np.ndarray) -> List[Dict]:
             mask = np.zeros((h, w), dtype=np.uint8)
             cv2.drawContours(mask, [contour], -1, 255, -1)
             
-            # Calculate confidence based on contour properties
+            # Shape-based segmentation score (NOT a model prediction probability).
+            # Circularity (4π·area / perimeter²) measures how "blob-like" the
+            # contour is: 1.0 = perfect circle, <1.0 = irregular shape.
+            # Score range: [0.50, 0.95].  This is used as a proxy for
+            # segmentation quality when no model IoU score is available.
+            # Downstream consumers should treat this as `sam_shape_score`,
+            # NOT as a semantic classification confidence.
             perimeter = cv2.arcLength(contour, True)
             circularity = 4 * np.pi * area / (perimeter * perimeter) if perimeter > 0 else 0
-            confidence = min(0.95, 0.50 + circularity * 0.45)  # More lenient baseline
-            
-            # Relaxed confidence threshold (was 0.4, now 0.3)
+            confidence = min(0.95, 0.50 + circularity * 0.45)
+
             if confidence <= 0.3:
                 continue
             
diff --git a/vision/unified_pipeline.py b/vision/unified_pipeline.py
index e47cefa..f3a9111 100644
--- a/vision/unified_pipeline.py
+++ b/vision/unified_pipeline.py
@@ -287,7 +287,10 @@ def _call_clip_classification(self) -> Dict[int, Dict]:
                 clip_map[region_id] = {
                     "label": region.get('label'),
                     "confidence": float(region.get('confidence', 0.0)),
-                    "is_top1_accurate": region.get('confidence', 0.0) >= 0.5  # Top-1 if confidence >= 0.5
+                    # confidence here is a softmax probability over candidate labels.
+                    # >= 0.5 means this label gets at least as much probability as
+                    # all other candidates combined — a high-precision bar.
+                    "is_top1_accurate": region.get('confidence', 0.0) >= 0.5
                 }
             
             return clip_map

From f903d3441381aa1b10c3edf939f1cb21fd85d6ec Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Sat, 11 Apr 2026 21:42:58 +0700
Subject: [PATCH 15/16] feat: add clip and obb to dashboard

---
 dashboard/index.html             | 267 ++++++++++++++++++++++++++++---
 vision/benchmark_dashboard.py    | 104 ++++++++++--
 vision/clip_classifier.py        | 138 +++++++++++++---
 vision/obb_angle_service_node.py |  66 +++++++-
 4 files changed, 514 insertions(+), 61 deletions(-)

diff --git a/dashboard/index.html b/dashboard/index.html
index 241e612..65cfee0 100644
--- a/dashboard/index.html
+++ b/dashboard/index.html
@@ -764,6 +764,46 @@
                     </tbody>
                 </table>
             </div>
+
+            <!-- find_object_angle_bb direct call history -->
+            <div style="margin-top:18px">
+                <div style="font-size:12px;font-weight:600;color:var(--text-secondary);margin-bottom:8px;letter-spacing:.4px">
+                    /obb/find_object_angle_bb — Direct Call History
+                    <span id="obbBBCount" style="margin-left:8px;background:#f97316;color:#fff;border-radius:10px;padding:1px 8px;font-size:11px">0</span>
+                </div>
+                <div class="metric-strip" style="margin-bottom:8px">
+                    <div class="metric-tile">
+                        <div class="metric-val" id="obbBBLatestAngle">—</div>
+                        <div class="metric-lbl">Latest Angle (°)</div>
+                    </div>
+                    <div class="metric-tile">
+                        <div class="metric-val" id="obbBBAvgAngle">—</div>
+                        <div class="metric-lbl">Avg Angle (°)</div>
+                    </div>
+                    <div class="metric-tile">
+                        <div class="metric-val" id="obbBBLatestObject">—</div>
+                        <div class="metric-lbl">Latest Object</div>
+                    </div>
+                </div>
+                <div class="table-wrap">
+                    <table>
+                        <thead><tr>
+                            <th>#</th>
+                            <th>Object ID</th>
+                            <th>Angle (°)</th>
+                            <th>Theta (rad)</th>
+                            <th>Center (u, v)</th>
+                            <th>Size (w × h px)</th>
+                            <th>Input BBox</th>
+                            <th>IoU</th>
+                            <th>Timestamp</th>
+                        </tr></thead>
+                        <tbody id="obbBBBody">
+                            <tr class="no-data-row"><td colspan="9">No data — call <code>ros2 service call /obb/find_object_angle_bb ...</code></td></tr>
+                        </tbody>
+                    </table>
+                </div>
+            </div>
         </div>
 
         <!-- ── SAM ──────────────────────────────────────────────────── -->
@@ -834,17 +874,59 @@
                 <table>
                     <thead><tr>
                         <th>Test ID</th>
-                        <th>Label</th>
+                        <th>CLIP Label</th>
                         <th>Confidence</th>
                         <th>Top-1 Accuracy</th>
+                        <th>Human Verdict</th>
                         <th>Bounding Box</th>
                         <th>Timestamp</th>
                     </tr></thead>
                     <tbody id="clipBody">
-                        <tr class="no-data-row"><td colspan="6">No CLIP data — start <code>/vision/classify_bbox_filtered</code></td></tr>
+                        <tr class="no-data-row"><td colspan="7">No CLIP data — call <code>ros2 service call /vision/classify_bbox_filtered std_srvs/srv/Trigger</code></td></tr>
                     </tbody>
                 </table>
             </div>
+
+            <!-- classify_all history sub-section -->
+            <div style="margin-top:18px">
+                <div style="font-size:12px;font-weight:600;color:var(--text-secondary);margin-bottom:8px;letter-spacing:.4px">
+                    /vision/classify_all — Direct Call History
+                    <span id="caCount" style="margin-left:8px;background:var(--color-clip);color:#fff;border-radius:10px;padding:1px 8px;font-size:11px">0</span>
+                </div>
+                <div class="metric-strip" style="margin-bottom:8px">
+                    <div class="metric-tile">
+                        <div class="metric-val" id="caLatestLabel">—</div>
+                        <div class="metric-lbl">Latest Top Label</div>
+                    </div>
+                    <div class="metric-tile">
+                        <div class="metric-val" id="caLatestConf">—</div>
+                        <div class="metric-lbl">Latest Confidence</div>
+                    </div>
+                    <div class="metric-tile">
+                        <div class="metric-val" id="caAvgConf">—</div>
+                        <div class="metric-lbl">Avg Confidence</div>
+                    </div>
+                    <div class="metric-tile">
+                        <div class="metric-val" id="caAvgLatency">—</div>
+                        <div class="metric-lbl">Avg Latency (s)</div>
+                    </div>
+                </div>
+                <div class="table-wrap">
+                    <table>
+                        <thead><tr>
+                            <th>#</th>
+                            <th>Top Label</th>
+                            <th>Confidence</th>
+                            <th>Top-5 Predictions</th>
+                            <th>Latency (s)</th>
+                            <th>Timestamp</th>
+                        </tr></thead>
+                        <tbody id="caBody">
+                            <tr class="no-data-row"><td colspan="6">No data — call <code>ros2 service call /vision/classify_all std_srvs/srv/Trigger</code></td></tr>
+                        </tbody>
+                    </table>
+                </div>
+            </div>
         </div>
 
         <!-- ── GraspNet ──────────────────────────────────────────────── -->
@@ -1024,10 +1106,18 @@
     // ── /api/data ─────────────────────────────────────────────────────────────
     let lastData = null;
 
+    // Holds latest filtered records so updateDashboard can merge them
+    let _latestFilteredRecords = [];
+
     async function fetchData() {
         try {
             const res = await fetch('/api/data');
             lastData = await res.json();
+            // Also refresh filtered history in the same tick
+            try {
+                const fr = await fetch('/api/classify-filtered-history');
+                _latestFilteredRecords = await fr.json();
+            } catch (_) { _latestFilteredRecords = []; }
             updateDashboard(lastData);
         } catch (e) {
             console.warn('Error fetching /api/data:', e);
@@ -1035,22 +1125,26 @@
     }
 
     function updateDashboard(data) {
+        // Merge /vision/classify_bbox_filtered records directly into clip table
+        const clipRecords = (data.clip_classifications || []).concat(_latestFilteredRecords);
+        const clipCount   = clipRecords.length;
+
         document.getElementById('totalCalls').textContent = data.metadata.total_calls;
         document.getElementById('pixelCount').textContent  = data.pixel_to_real.length;
         document.getElementById('samCount').textContent    = data.sam_detections.length;
-        document.getElementById('clipCount').textContent   = data.clip_classifications.length;
+        document.getElementById('clipCount').textContent   = clipCount;
         document.getElementById('graspCount').textContent  = data.grasp_detections.length;
         document.getElementById('sceneCount').textContent  = data.scene_understanding.length;
 
         setNav('nav-sam',   data.sam_detections.length);
-        setNav('nav-clip',  data.clip_classifications.length);
+        setNav('nav-clip',  clipCount);
         setNav('nav-grasp', data.grasp_detections.length);
         setNav('nav-scene', data.scene_understanding.length);
         setNav('nav-pixel', data.pixel_to_real.length);
 
         updatePixelToReal(data.pixel_to_real);
         updateSAMDetections(data.sam_detections);
-        updateCLIPClassifications(data.clip_classifications);
+        updateCLIPClassifications(clipRecords);
         updateGraspDetections(data.grasp_detections);
         updateSceneUnderstanding(data.scene_understanding);
 
@@ -1127,32 +1221,71 @@
         </tr>`).join('');
     }
 
+    // ── CLIP verdict buttons ──────────────────────────────────────────────────
+    async function clipVerdict(testId, verdict) { // POST a verdict for one CLIP record, then re-render the CLIP table
+        try {
+            await fetch('/api/clip-verdict', {
+                method: 'POST',
+                headers: {'Content-Type': 'application/json'},
+                body: JSON.stringify({test_id: testId, verdict}) // payload shape: {test_id, verdict}
+            });
+            // Re-fetch the filtered history right away so the verdict buttons reflect the new state
+            _latestFilteredRecords = []; // reset first: if the re-fetch below fails, the list stays empty
+            try {
+                const fr = await fetch('/api/classify-filtered-history');
+                _latestFilteredRecords = await fr.json();
+            } catch (_) {} // best-effort: a failed refresh is ignored
+            if (lastData) updateCLIPClassifications( // re-render only once /api/data has been loaded (lastData starts as null)
+                (lastData.clip_classifications || []).concat(_latestFilteredRecords)
+            );
+        } catch (e) { console.warn('clip verdict error:', e); } // failures are logged, not rethrown
+    }
+
     // ── CLIP Classifications ──────────────────────────────────────────────────
     function updateCLIPClassifications(records) {
         document.getElementById('clipBadge').textContent = `${records.length} Records`;
         const tbody = document.getElementById('clipBody');
         if (!records.length) {
-            tbody.innerHTML = '<tr class="no-data-row"><td colspan="6">No CLIP data — start <code>/vision/classify_bbox_filtered</code></td></tr>';
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="7">No CLIP data — call <code>ros2 service call /vision/classify_bbox_filtered std_srvs/srv/Trigger</code></td></tr>';
             ['clipTop1','clipAvgConf'].forEach(id => document.getElementById(id).textContent = '—');
             return;
         }
-        const withAcc = records.filter(r => r.top1_accuracy !== null);
-        const top1Acc = withAcc.length
-            ? (withAcc.filter(r => r.top1_accuracy).length / withAcc.length * 100).toFixed(1) + '%'
-            : 'N/A';
+        // Top-1 accuracy is computed only over records whose top1_accuracy is set (i.e. a verdict exists)
+        const withVerdict = records.filter(r => r.top1_accuracy !== null && r.top1_accuracy !== undefined);
+        const top1Acc = withVerdict.length
+            ? (withVerdict.filter(r => r.top1_accuracy).length / withVerdict.length * 100).toFixed(1) + '%'
+            : 'Pending';
         const avgConf = records.reduce((s, r) => s + r.confidence, 0) / records.length;
 
-        document.getElementById('clipTop1').textContent   = top1Acc;
+        document.getElementById('clipTop1').textContent    = top1Acc;
         document.getElementById('clipAvgConf').textContent = avgConf.toFixed(3);
 
-        tbody.innerHTML = records.slice(-50).reverse().map(r => `<tr>
-            <td class="mono">${r.test_id}</td>
-            <td><span class="chip chip-label">${r.label}</span></td>
-            <td>${confBar(r.confidence)}</td>
-            <td>${formatAccuracy(r.top1_accuracy)}</td>
-            <td class="mono" style="font-size:11px">${JSON.stringify(r.bbox)}</td>
-            <td>${tsShort(r.timestamp)}</td>
-        </tr>`).join('');
+        tbody.innerHTML = records.slice(-50).reverse().map(r => {
+            // Verdict display
+            let verdictCell;
+            if (r.top1_accuracy === true) {
+                verdictCell = `<span style="color:var(--ok);font-weight:600">✓ Correct</span>
+                    <button onclick="clipVerdict(${r.test_id}, false)" style="margin-left:6px;font-size:10px;padding:1px 5px;cursor:pointer;border:1px solid var(--border);border-radius:4px;background:#fff">✗</button>`;
+            } else if (r.top1_accuracy === false) {
+                verdictCell = `<span style="color:var(--fail);font-weight:600">✗ Wrong</span>
+                    <button onclick="clipVerdict(${r.test_id}, true)" style="margin-left:6px;font-size:10px;padding:1px 5px;cursor:pointer;border:1px solid var(--border);border-radius:4px;background:#fff">✓</button>`;
+            } else {
+                verdictCell = `<button onclick="clipVerdict(${r.test_id}, true)"  style="font-size:11px;padding:2px 8px;cursor:pointer;border:1px solid var(--ok);color:var(--ok);border-radius:4px;background:#fff;margin-right:4px">✓ Correct</button>
+                               <button onclick="clipVerdict(${r.test_id}, false)" style="font-size:11px;padding:2px 8px;cursor:pointer;border:1px solid var(--fail);color:var(--fail);border-radius:4px;background:#fff">✗ Wrong</button>`;
+            }
+            const bboxStr = r.bbox ? (typeof r.bbox === 'object' && !Array.isArray(r.bbox)
+                ? `(${r.bbox.x1},${r.bbox.y1})→(${r.bbox.x2},${r.bbox.y2})`
+                : JSON.stringify(r.bbox)) : '—';
+            return `<tr>
+                <td class="mono">${r.test_id}</td>
+                <td><span class="chip chip-label">${r.label}</span></td>
+                <td>${confBar(r.confidence)}</td>
+                <td>${r.top1_accuracy === true ? '<span style="color:var(--ok)">TRUE</span>' : r.top1_accuracy === false ? '<span style="color:var(--fail)">FALSE</span>' : '<span style="color:var(--text-muted)">—</span>'}</td>
+                <td>${verdictCell}</td>
+                <td class="mono" style="font-size:11px">${bboxStr}</td>
+                <td>${tsShort(r.timestamp)}</td>
+            </tr>`;
+        }).join('');
     }
 
     // ── Grasp Detections ──────────────────────────────────────────────────────
@@ -1386,6 +1519,94 @@
         }).join('');
     }
 
+    // ── /vision/classify_all history ─────────────────────────────────────────
+    async function fetchClassifyAllHistory() { // fetch /api/classify-all-history and render it
+        try {
+            const res = await fetch('/api/classify-all-history');
+            if (!res.ok) return; // non-OK response: leave the currently displayed rows untouched
+            const records = await res.json();
+            updateClassifyAllHistory(records);
+        } catch (_) {} // network/parse/render errors are swallowed silently
+    }
+
+    function updateClassifyAllHistory(records) { // render the classify_all counter, metric tiles and history table
+        document.getElementById('caCount').textContent = records.length;
+        const tbody = document.getElementById('caBody');
+        if (!records.length) { // empty history: show the placeholder row and reset every tile to '—'
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="6">No data — call <code>ros2 service call /vision/classify_all std_srvs/srv/Trigger</code></td></tr>';
+            ['caLatestLabel','caLatestConf','caAvgConf','caAvgLatency'].forEach(id => document.getElementById(id).textContent = '—');
+            return;
+        }
+        const latest = records[records.length - 1]; // the last element is treated as the most recent call
+        document.getElementById('caLatestLabel').textContent = latest.top_label || '—';
+        document.getElementById('caLatestConf').textContent  = latest.top_confidence != null ? (latest.top_confidence * 100).toFixed(1) + '%' : '—';
+        const avgConf = records.reduce((s, r) => s + (r.top_confidence || 0), 0) / records.length; // missing confidence counts as 0
+        document.getElementById('caAvgConf').textContent = (avgConf * 100).toFixed(1) + '%';
+        const avgLat  = records.reduce((s, r) => s + (r.latency_s || 0), 0) / records.length; // missing latency counts as 0
+        document.getElementById('caAvgLatency').textContent = avgLat.toFixed(3) + ' s';
+        // Table body: the last 50 records, newest first
+        tbody.innerHTML = records.slice(-50).reverse().map(r => {
+            const top5 = (r.all_predictions || []).slice(0, 5).map(p =>
+                `<span class="chip chip-label" style="font-size:10px">${p.label} <strong>${(p.confidence*100).toFixed(0)}%</strong></span>`
+            ).join(' ');
+            return `<tr>
+                <td class="mono">${r.call_id}</td>
+                <td><span class="chip chip-label" style="background:var(--color-clip);color:#fff">${r.top_label}</span></td>
+                <td>${confBar(r.top_confidence)}</td>
+                <td style="max-width:280px;overflow:hidden">${top5}</td>
+                <td class="mono">${r.latency_s != null ? r.latency_s.toFixed(3) : '—'}</td>
+                <td>${tsShort(r.timestamp)}</td>
+            </tr>`;
+        }).join('');
+    }
+
+    // ── /obb/find_object_angle_bb history ────────────────────────────────────
+    async function fetchObbBBHistory() { // fetch /api/obb-bb-history and render it
+        try {
+            const res = await fetch('/api/obb-bb-history');
+            if (!res.ok) return; // non-OK response: leave the currently displayed rows untouched
+            const records = await res.json();
+            updateObbBBHistory(records);
+        } catch (_) {} // network/parse/render errors are swallowed silently
+    }
+
+    function updateObbBBHistory(records) {
+        document.getElementById('obbBBCount').textContent = records.length;
+        const tbody = document.getElementById('obbBBBody');
+        if (!records.length) {
+            tbody.innerHTML = '<tr class="no-data-row"><td colspan="9">No data — call <code>ros2 service call /obb/find_object_angle_bb ...</code></td></tr>';
+            ['obbBBLatestAngle','obbBBAvgAngle','obbBBLatestObject'].forEach(id => document.getElementById(id).textContent = '—');
+            return;
+        }
+        const latest = records[records.length - 1];
+        document.getElementById('obbBBLatestAngle').textContent  = latest.angle_deg != null ? latest.angle_deg.toFixed(1) + '°' : '—';
+        document.getElementById('obbBBLatestObject').textContent = latest.object_id || '—';
+        const avgAngle = records.reduce((s, r) => s + (r.angle_deg || 0), 0) / records.length;
+        document.getElementById('obbBBAvgAngle').textContent = avgAngle.toFixed(1) + '°';
+
+        tbody.innerHTML = records.slice(-50).reverse().map(r => {
+            const pct      = Math.round(((r.angle_deg + 90) / 180) * 100);
+            const barColor = Math.abs(r.angle_deg) < 20 ? 'var(--ok)' : Math.abs(r.angle_deg) < 60 ? 'var(--warn)' : 'var(--fail)';
+            const bb = r.input_bbox || [];
+            return `<tr>
+                <td class="mono">${r.call_id}</td>
+                <td class="mono">${r.object_id ?? '—'}</td>
+                <td>
+                    <div class="conf-bar">
+                        <div class="conf-track" style="width:70px"><div class="conf-fill" style="width:${pct}%;background:${barColor}"></div></div>
+                        <span class="conf-num" style="color:${barColor};min-width:50px">${r.angle_deg.toFixed(1)}°</span>
+                    </div>
+                </td>
+                <td class="mono">${r.theta_rad != null ? r.theta_rad.toFixed(4) : '—'}</td>
+                <td class="mono">${r.center_u != null ? Math.round(r.center_u) : '—'}, ${r.center_v != null ? Math.round(r.center_v) : '—'}</td>
+                <td class="mono">${r.width_px != null ? Math.round(r.width_px) : '—'} × ${r.height_px != null ? Math.round(r.height_px) : '—'}</td>
+                <td class="mono" style="font-size:11px">${bb.length === 4 ? `(${bb[0]},${bb[1]})→(${bb[2]},${bb[3]})` : '—'}</td>
+                <td class="mono">${r.iou != null ? r.iou.toFixed(3) : '—'}</td>
+                <td>${tsShort(r.timestamp)}</td>
+            </tr>`;
+        }).join('');
+    }
+
     // ── Clear data (legacy) ───────────────────────────────────────────────────
     async function clearData() {
         if (confirm('Clear all in-session benchmark data?')) {
@@ -1394,10 +1615,14 @@
     }
 
     // ── Polling ───────────────────────────────────────────────────────────────
-    setInterval(fetchData,       2000);
-    setInterval(fetchRunHistory, 2000);
+    setInterval(fetchData,             2000);
+    setInterval(fetchRunHistory,       2000);
+    setInterval(fetchClassifyAllHistory, 3000);
+    setInterval(fetchObbBBHistory,       3000);
     fetchData();
     fetchRunHistory();
+    fetchClassifyAllHistory();
+    fetchObbBBHistory();
 </script>
 </body>
 </html>
diff --git a/vision/benchmark_dashboard.py b/vision/benchmark_dashboard.py
index 67ef805..4958021 100644
--- a/vision/benchmark_dashboard.py
+++ b/vision/benchmark_dashboard.py
@@ -16,6 +16,10 @@
 Usage:
     ros2 run vision benchmark_dashboard
     
+
+    ros2 service call /benchmark/clear_data std_srvs/srv/Trigger
+
+
     Then open browser: http://localhost:8080
 """
 
@@ -317,19 +321,11 @@ def add_grasp_detection_record(self, grasp_pose):
         self.data['metadata']['total_calls'] += 1
     
     def sync_from_run_history(self):
-        """Sync CLIP, GraspNet, OBB, and Pixel-to-Real data from vision_runs_history.json
-        so the /api/data endpoint (CLIP / GraspNet / Pixel-to-Real sections) stays populated
-        even when those dedicated service nodes are not running."""
+        """Sync CLIP, GraspNet, OBB, and Pixel-to-Real data from history files
+        so the /api/data endpoint stays populated even when service nodes are not running."""
         try:
             from pathlib import Path
-            history_file = Path(__file__).parent.parent / 'vision_runs_history.json'
-            if not history_file.exists():
-                return
-
-            with open(history_file, 'r') as f:
-                runs = json.load(f)
-            if not isinstance(runs, list) or not runs:
-                return
+            package_path = Path(__file__).parent.parent
 
             timestamp = datetime.now().isoformat()
 
@@ -339,6 +335,17 @@ def sync_from_run_history(self):
             new_pixel  = []
             new_obb    = []
 
+            history_file = package_path / 'vision_runs_history.json'
+            runs = []
+            if history_file.exists():
+                try:
+                    with open(history_file, 'r') as f:
+                        data = json.load(f)
+                    if isinstance(data, list):
+                        runs = data
+                except Exception:
+                    runs = []
+
             for run in runs:
                 run_ts    = run.get('meta', {}).get('timestamp', timestamp)
                 run_no    = run.get('meta', {}).get('run_no', 0)
@@ -416,6 +423,17 @@ def sync_from_run_history(self):
                                      obj.get('bbox_x2', 0), obj.get('bbox_y2', 0)],
                         })
 
+            # Also merge records from /vision/classify_bbox_filtered direct calls
+            filtered_file = Path(__file__).parent.parent / 'classify_filtered_history.json'
+            if filtered_file.exists():
+                try:
+                    with open(filtered_file, 'r') as f:
+                        filtered_records = json.load(f)
+                    if filtered_records:
+                        new_clip = (new_clip + filtered_records)[-1000:]
+                except Exception:
+                    pass
+
             # Only update if we got new data (avoids overwriting live topic data with empty)
             if new_clip:
                 self.data['clip_classifications'] = new_clip[-1000:]
@@ -436,7 +454,7 @@ def publish_data(self):
         self.data_publisher.publish(msg)
 
     def clear_data_callback(self, request, response):
-        """Clear all benchmark data"""
+        """Clear all benchmark data (in-memory + persistent JSON files)"""
         self.data = {
             'pixel_to_real': [],
             'sam_detections': [],
@@ -450,10 +468,27 @@ def clear_data_callback(self, request, response):
             }
         }
 
+        # Also wipe the persistent history files so sync_from_run_history
+        # doesn't immediately repopulate from stale data
+        package_path = Path(__file__).parent.parent
+        files_to_clear = [
+            'vision_runs_history.json',
+            'classify_filtered_history.json',
+            'classify_all_history.json',
+            'obb_bb_history.json',
+        ]
+        for fname in files_to_clear:
+            fpath = package_path / fname
+            if fpath.exists():
+                try:
+                    with open(fpath, 'w') as f:
+                        json.dump([], f)
+                except Exception as e:
+                    self.get_logger().warn(f'Could not clear {fname}: {e}')
+
         response.success = True
         response.message = "Benchmark data cleared"
-
-        self.get_logger().info('Benchmark data cleared')
+        self.get_logger().info('Benchmark data cleared (memory + files)')
         return response
     
     def start_http_server(self):
@@ -532,6 +567,21 @@ def do_GET(self):
                     data = self._read_json_file(fo_file, [])
                     self._json_response(data)
 
+                elif self.path == '/api/classify-all-history':
+                    ca_file = package_path / 'classify_all_history.json'
+                    data = self._read_json_file(ca_file, [])
+                    self._json_response(data)
+
+                elif self.path == '/api/classify-filtered-history':
+                    cf_file = package_path / 'classify_filtered_history.json'
+                    data = self._read_json_file(cf_file, [])
+                    self._json_response(data)
+
+                elif self.path == '/api/obb-bb-history':
+                    obb_file = package_path / 'obb_bb_history.json'
+                    data = self._read_json_file(obb_file, [])
+                    self._json_response(data)
+
                 else:
                     super().do_GET()
 
@@ -555,9 +605,35 @@ def do_POST(self):
                     self._write_json_file(fo_file, [])
                     self._json_response({'ok': True})
 
+                elif self.path == '/api/clip-verdict':
+                    self._handle_clip_verdict(payload)
+
                 else:
                     self._json_response({'error': 'unknown endpoint'}, 404)
 
+            # ── /api/clip-verdict ─────────────────────────────────────────
+            def _handle_clip_verdict(self, payload):
+                """Store a reviewer's top-1 verdict on one filtered CLIP record.
+
+                Replies with status 400 when ``test_id`` or ``verdict`` is missing and
+                404 when no stored record matches; only the first match is updated.
+                """
+                test_id = payload.get('test_id')
+                verdict = payload.get('verdict')  # True / False
+                if verdict is None or test_id is None:
+                    self._json_response({'error': 'test_id and verdict required'}, 400)
+                    return
+
+                cf_file = package_path / 'classify_filtered_history.json'
+                records = self._read_json_file(cf_file, [])
+                hit = next((rec for rec in records if rec.get('test_id') == test_id), None)
+                if hit is None:
+                    self._json_response({'error': f'test_id {test_id} not found'}, 404)
+                    return
+                hit['top1_accuracy'] = bool(verdict)
+                self._write_json_file(cf_file, records)
+                self._json_response({'ok': True})
+
             # ── /api/find-object ──────────────────────────────────────────
             def _handle_find_object(self, payload):
                 """Call /find_object ROS2 service and persist result."""
diff --git a/vision/clip_classifier.py b/vision/clip_classifier.py
index 312e3db..9004e42 100755
--- a/vision/clip_classifier.py
+++ b/vision/clip_classifier.py
@@ -129,6 +129,14 @@ def __init__(self, candidate_labels: List[str] = None):
             # "cobot",
             "green_cube",
             "drill",
+            "remote_control",
+            "orange_cube",
+            "orange_cylinder",
+            "arduino_board",
+            "mouse",
+            "light_blue_cube",
+            "blue_star",
+            "purple_triangle",
             "pink_cube",
             "measuring_tape",
             "screwdriver",
@@ -141,11 +149,11 @@ def __init__(self, candidate_labels: List[str] = None):
             # "door_handle",
             # "red_ball",
             # "gasket_part",
-            "beer_can",
+            # "beer_can",
             "bowl",
-            "cinder_block",
-            "coke_can",
-            "roomba",
+            # "cinder_block",
+            # "coke_can",
+            # "roomba",
             # "plastic_cup",
             # "hammer",
             # "robotic_arm",
@@ -387,13 +395,16 @@ def classify_all_callback(self, request, response):
             
             response.success = True
             response.message = json.dumps(classification_data, indent=2)
-            
+
             top_pred = classification_data['output']['top_prediction']
             self.get_logger().info(
                 f"Classification complete: {top_pred['label']} "
                 f"(confidence: {top_pred['confidence']:.2f})"
             )
-            
+
+            # Persist result for dashboard
+            self._save_classify_all_record(classification_data, latency_s=(time.perf_counter() - start))
+
         except Exception as e:
             response.success = False
             response.message = json.dumps({
@@ -563,17 +574,31 @@ def classify_bbox_filtered_callback(self, request, response):
                 self.get_logger().error("CLIP model not available")
                 return response
             
-            # Check if we have classified regions from SAM subscription
+            # If no SAM regions cached, trigger a fresh detection + classification now
             if not self.latest_region_classifications:
-                response.success = False
-                response.message = json.dumps({
-                    "error": "No classified regions available. Call '/vision/run_pipeline' first to trigger SAM detection.",
-                    "hint": "ros2 service call /vision/run_pipeline std_srvs/srv/Trigger",
-                    "timestamp": datetime.utcnow().isoformat() + "Z"
-                }, indent=2)
-                self.get_logger().warn("No classified regions. Run SAM pipeline first.")
-                return response
-            
+                self.get_logger().info("No cached regions — calling /vision/detect_objects automatically...")
+                bboxes, err = self._call_detect_objects()
+                if err:
+                    response.success = False
+                    response.message = json.dumps({
+                        "error": err,
+                        "hint": "Ensure simple_sam_detector is running",
+                        "timestamp": datetime.utcnow().isoformat() + "Z"
+                    }, indent=2)
+                    self.get_logger().warn(f"Detection failed: {err}")
+                    return response
+                if not bboxes:
+                    response.success = False
+                    response.message = json.dumps({
+                        "error": "No objects detected in the scene",
+                        "timestamp": datetime.utcnow().isoformat() + "Z"
+                    }, indent=2)
+                    self.get_logger().warn("No bboxes returned from detection")
+                    return response
+                self.get_logger().info(f"Got {len(bboxes)} bboxes from detection — classifying with CLIP...")
+                classification_data = self._classify_regions(self.captured_frame, bboxes)
+                self.latest_region_classifications = classification_data['output']['classified_regions']
+
             self.get_logger().info(f"Filtering {len(self.latest_region_classifications)} classified regions by confidence > 0.5")
             
             # Filter regions by confidence >= 0.5
@@ -602,18 +627,21 @@ def classify_bbox_filtered_callback(self, request, response):
             
             response.success = True
             response.message = json.dumps(result, indent=2)
-            
+
             self.get_logger().info(
                 f"Filtered classification complete: {len(filtered_regions)}/{len(self.latest_region_classifications)} "
                 f"regions passed confidence threshold"
             )
-            
+
             # Log each filtered region
             for region in filtered_regions:
                 self.get_logger().info(
                     f"Region #{region['region_id']}: {region['label']} "
                     f"(confidence: {region['confidence']:.2f})"
                 )
+
+            # Persist to file so benchmark_dashboard can show results in CLIP table
+            self._save_filtered_records(filtered_regions)
             
         except Exception as e:
             response.success = False
@@ -1252,7 +1280,79 @@ def _classify_image(self, rgb_image: np.ndarray) -> Dict:
         }
         
         return schema
-    
+
+    def _save_classify_all_record(self, classification_data: Dict, latency_s: float = 0.0):
+        """Append a /vision/classify_all result to classify_all_history.json for the dashboard.
+
+        Keeps the newest 500 records; ``call_id`` continues from the highest stored id.
+        """
+        try:
+            from pathlib import Path
+            history_file = Path(__file__).parent.parent / 'classify_all_history.json'
+            history = []
+            if history_file.exists():
+                try:
+                    with open(history_file, 'r') as f:
+                        history = json.load(f)
+                except Exception:
+                    history = []
+            if not isinstance(history, list):
+                history = []  # unexpected JSON shape: start over instead of failing
+
+            output = classification_data.get('output', {})
+            top_pred = output.get('top_prediction', {})
+            meta = output.get('metadata', {})
+            next_id = max((rec.get('call_id') or 0 for rec in history), default=0) + 1
+            history.append({
+                'call_id': next_id,  # len(history) + 1 would repeat once the cap is hit
+                'timestamp': datetime.utcnow().isoformat() + 'Z',
+                'top_label': top_pred.get('label', ''),
+                'top_confidence': float(top_pred.get('confidence', 0.0)),
+                'all_predictions': output.get('all_predictions', [])[:10],  # store top-10
+                'processing_time_ms': meta.get('processing_time_ms', 0),
+                'latency_s': round(latency_s, 4),
+                'device': meta.get('device', ''),
+            })
+
+            with open(history_file, 'w') as f:
+                json.dump(history[-500:], f, indent=2)  # keep only the last 500 records
+        except Exception as e:
+            self.get_logger().warn(f'Failed to save classify_all record: {e}')
+
+    def _save_filtered_records(self, filtered_regions: list):
+        """Append /vision/classify_bbox_filtered results to classify_filtered_history.json.
+        Each region becomes one record in the format the dashboard CLIP table expects.
+        ``test_id`` continues from the highest stored id, so ids stay unique after the
+        history is trimmed to its newest 1000 records."""
+        try:
+            from pathlib import Path
+            history_file = Path(__file__).parent.parent / 'classify_filtered_history.json'
+            history = []
+            if history_file.exists():
+                try:
+                    with open(history_file, 'r') as f:
+                        history = json.load(f)
+                except Exception:
+                    history = []
+            if not isinstance(history, list):
+                history = []  # unexpected JSON shape: start over instead of failing
+
+            timestamp = datetime.utcnow().isoformat() + 'Z'
+            next_id = max((rec.get('test_id') or 0 for rec in history), default=0) + 1
+            history.extend({
+                'test_id': next_id + i,
+                'timestamp': timestamp,
+                'label': region['label'],
+                'confidence': float(region['confidence']),
+                'top1_accuracy': None,  # set by human-in-the-loop verdict
+                'bbox': region.get('bbox', {}),
+            } for i, region in enumerate(filtered_regions))
+
+            with open(history_file, 'w') as f:
+                json.dump(history[-1000:], f, indent=2)
+        except Exception as e:
+            self.get_logger().warn(f'Failed to save filtered records: {e}')
+
     def _classify_regions(self, rgb_image: np.ndarray, bboxes: List[List[int]]) -> Dict:
         """
         Classify multiple image regions using CLIP model
diff --git a/vision/obb_angle_service_node.py b/vision/obb_angle_service_node.py
index 649ee0b..0518fa8 100644
--- a/vision/obb_angle_service_node.py
+++ b/vision/obb_angle_service_node.py
@@ -42,10 +42,13 @@
 from custom_interfaces.msg import SAMDetections
 from sensor_msgs.msg import Image, CameraInfo
 from cv_bridge import CvBridge
+import json
 import numpy as np
 import cv2
 import time
 import threading
+from datetime import datetime
+from pathlib import Path
 
 
 class OBBAngleServiceNode(Node):
@@ -715,20 +718,34 @@ def find_object_angle_bb_callback(self, request, response):
             theta_result = np.deg2rad(angle_result_deg)
 
             # Populate response (use remapped theta, keep geometry unchanged)
+            angle_deg = angle_result_deg
             response.success = True
-            response.message = f'OBB calculated for {best_detection.object_id} within bbox [{request.x1}, {request.y1}, {request.x2}, {request.y2}]'
+            response.message = json.dumps({
+                "success": True,
+                "object_id": best_detection.object_id,
+                "input_bbox": [request.x1, request.y1, request.x2, request.y2],
+                "center": {"u": round(u, 2), "v": round(v, 2)},
+                "theta_rad": round(float(theta_result), 6),
+                "angle_deg": round(float(angle_deg), 2),
+                "width_px": round(float(width), 2),
+                "height_px": round(float(height), 2),
+                "iou_with_request": round(float(best_iou), 4),
+                "timestamp": datetime.utcnow().isoformat() + "Z",
+            })
             response.u = u
             response.v = v
             response.theta = theta_result
             response.width = width
             response.height = height
-            
+
             # Log results concisely
-            angle_deg = angle_result_deg
             self.get_logger().info('=' * 60)
             self.get_logger().info(f'OBB Result ({best_detection.object_id}): center=({u:.1f},{v:.1f}), angle={angle_deg:.1f}deg, size={width:.0f}x{height:.0f}')
             self.get_logger().info('=' * 60)
-            
+
+            # Persist to history file for dashboard
+            self._save_obb_bb_record(best_detection.object_id, request, u, v, theta_result, angle_deg, width, height, best_iou)
+
             # Queue visualization; do not block service response path.
             viz_data = [(best_detection.object_id, u, v, theta_geom, width, height, [request.x1, request.y1, request.x2, request.y2])]
             self.queue_visualization(viz_data, mode="single")
@@ -738,15 +755,50 @@ def find_object_angle_bb_callback(self, request, response):
             import traceback
             self.get_logger().error(traceback.format_exc())
             response.success = False
-            response.message = f'Internal error: {str(e)}'
+            response.message = json.dumps({"success": False, "error": str(e)})
             response.u = 0.0
             response.v = 0.0
             response.theta = 0.0
             response.width = 0.0
             response.height = 0.0
-        
+
         return response
-    
+
+    def _save_obb_bb_record(self, object_id, request, u, v, theta_rad, angle_deg, width, height, iou):
+        """Persist /obb/find_object_angle_bb result to obb_bb_history.json for the dashboard.
+        Keeps the newest 500 records; ``call_id`` continues from the highest stored id."""
+        try:
+            history_file = Path(__file__).parent.parent / 'obb_bb_history.json'
+            history = []
+            if history_file.exists():
+                try:
+                    with open(history_file, 'r') as f:
+                        history = json.load(f)
+                except Exception:
+                    history = []
+            if not isinstance(history, list):
+                history = []  # unexpected JSON shape: start over instead of failing
+            next_id = max((rec.get('call_id') or 0 for rec in history), default=0) + 1
+
+            history.append({
+                'call_id': next_id,  # len(history) + 1 would repeat once the cap is hit
+                'timestamp': datetime.utcnow().isoformat() + 'Z',
+                'object_id': object_id,
+                'input_bbox': [request.x1, request.y1, request.x2, request.y2],
+                'center_u': round(float(u), 2),
+                'center_v': round(float(v), 2),
+                'theta_rad': round(float(theta_rad), 6),
+                'angle_deg': round(float(angle_deg), 2),
+                'width_px': round(float(width), 2),
+                'height_px': round(float(height), 2),
+                'iou': round(float(iou), 4),
+            })
+
+            with open(history_file, 'w') as f:
+                json.dump(history[-500:], f, indent=2)
+        except Exception as e:
+            self.get_logger().warn(f'Failed to save obb_bb record: {e}')
+
     def find_object_angle_callback(self, request, response):
         """
         Service callback for /obb/find_object_angle

From 3fdf50c936dfe69c86836f99a20859d8fdd9acb0 Mon Sep 17 00:00:00 2001
From: Kanisorn-S <karamahati@gmail.com>
Date: Sat, 11 Apr 2026 21:57:07 +0700
Subject: [PATCH 16/16] feat: add test for clip in dashboard and fix path clip
 issue dashboard

---
 test/test_clip_filtered_dashboard.py | 184 +++++++++++++++++++++++++++
 1 file changed, 184 insertions(+)
 create mode 100644 test/test_clip_filtered_dashboard.py

diff --git a/test/test_clip_filtered_dashboard.py b/test/test_clip_filtered_dashboard.py
new file mode 100644
index 0000000..995b5a0
--- /dev/null
+++ b/test/test_clip_filtered_dashboard.py
@@ -0,0 +1,184 @@
+#!/usr/bin/env python3
+"""
+Unit tests: verify classify_filtered_history.json path, format, and HTTP endpoint.
+
+Run directly (no ROS needed):
+    python3 test/test_clip_filtered_dashboard.py
+"""
+
+import json
+import unittest
+import urllib.request
+import urllib.error
+from pathlib import Path
+
+# ── Path constants ────────────────────────────────────────────────────────────
+INSTALL_VISION = Path(
+    '/home/group11/final_project_ws/install/vision'
+    '/lib/python3.12/site-packages/vision'
+)
+INSTALL_PKG    = INSTALL_VISION.parent          # site-packages/
+SRC_VISION     = Path(
+    '/home/group11/final_project_ws/src/vision/vision'
+)
+SRC_PKG        = SRC_VISION.parent              # src/vision/
+
+DASHBOARD_URL  = 'http://localhost:8080'
+
+
+def _resolve_package_path(py_file: Path) -> Path:
+    """Return ``py_file.parent.parent``, mirroring ``Path(__file__).parent.parent`` in the nodes."""
+    return py_file.parent.parent
+
+
+class TestPathConsistency(unittest.TestCase):
+    """Writer (clip_classifier) and reader (benchmark_dashboard) must resolve the same JSON file."""
+
+    def test_install_clip_and_dashboard_same_path(self):
+        clip_path = _resolve_package_path(INSTALL_VISION / 'clip_classifier.py') \
+                    / 'classify_filtered_history.json'
+        dash_path = _resolve_package_path(INSTALL_VISION / 'benchmark_dashboard.py') \
+                    / 'classify_filtered_history.json'
+        self.assertEqual(clip_path, dash_path,
+            f"clip writes to {clip_path} but dashboard reads from {dash_path}")
+
+    def test_src_and_install_expected_dir(self):
+        """The installed package path must be under site-packages, not src/vision."""
+        install_pkg_path = _resolve_package_path(INSTALL_VISION / 'clip_classifier.py')
+        self.assertIn('site-packages', str(install_pkg_path),
+            f"install path looks wrong: {install_pkg_path}")
+
+    def test_filtered_file_exists(self):
+        fpath = INSTALL_PKG / 'classify_filtered_history.json'
+        self.assertTrue(fpath.exists(),
+            f"classify_filtered_history.json not found at {fpath}")
+
+
+class TestFilteredFileFormat(unittest.TestCase):
+    """Validate the records stored in the installed classify_filtered_history.json."""
+
+    @classmethod
+    def setUpClass(cls):
+        fpath = INSTALL_PKG / 'classify_filtered_history.json'
+        if fpath.exists():
+            with open(fpath) as f:
+                cls.records = json.load(f)
+        else:
+            cls.records = []  # a missing file is treated as an empty history
+
+    def test_file_not_empty(self):
+        self.assertGreater(len(self.records), 0,
+            "classify_filtered_history.json is empty – call "
+            "/vision/classify_bbox_filtered first")
+
+    def test_required_fields_present(self):
+        required = {'test_id', 'timestamp', 'label', 'confidence', 'top1_accuracy', 'bbox'}
+        for i, rec in enumerate(self.records[:5]):  # only the first 5 records are sampled
+            missing = required - rec.keys()
+            self.assertFalse(missing,
+                f"Record #{i} missing fields: {missing}\nRecord: {rec}")
+
+    def test_confidence_is_float_in_range(self):
+        for i, rec in enumerate(self.records[:20]):  # only the first 20 records are sampled
+            c = rec.get('confidence')
+            self.assertIsInstance(c, float,
+                f"Record #{i}: confidence should be float, got {type(c)}")
+            self.assertGreaterEqual(c, 0.0)
+            self.assertLessEqual(c, 1.0)
+
+    def test_top1_accuracy_is_null_or_bool(self):
+        for i, rec in enumerate(self.records):
+            acc = rec.get('top1_accuracy')
+            self.assertIn(type(acc), (type(None), bool),
+                f"Record #{i}: top1_accuracy should be None or bool, got {type(acc)}: {acc}")
+
+    def test_bbox_is_list_or_dict(self):
+        for i, rec in enumerate(self.records[:10]):  # only the first 10 records are sampled
+            bbox = rec.get('bbox')
+            self.assertIsNotNone(bbox, f"Record #{i}: bbox is None")
+            self.assertIn(type(bbox), (list, dict),
+                f"Record #{i}: bbox type {type(bbox)}")
+
+    def test_no_auto_true_verdicts_in_new_records(self):
+        """The newest record must still have top1_accuracy=None (no automatic verdict)."""
+        # Only the last record in the file is inspected; it should be null, not auto-True.
+        if not self.records:
+            self.skipTest("No records to check")
+        last = self.records[-1]
+        self.assertIsNone(last.get('top1_accuracy'),
+            f"Latest record has auto-verdict instead of null: {last}")
+
+
+class TestHTTPEndpoint(unittest.TestCase):
+    """Live checks of the dashboard HTTP API; skipped when the server is unreachable."""
+
+    def _get(self, path):
+        """Return ``(status, parsed_json)``, or ``(code, None)`` on an HTTP error status."""
+        try:
+            with urllib.request.urlopen(DASHBOARD_URL + path, timeout=5) as r:
+                return r.status, json.loads(r.read())
+        except urllib.error.HTTPError as e:
+            return e.code, None
+        except OSError as e:  # connection/timeout only; a malformed JSON body must fail, not skip
+            self.skipTest(f"Dashboard not reachable ({e})")
+
+    def test_endpoint_exists_returns_200(self):
+        status, _ = self._get('/api/classify-filtered-history')
+        self.assertEqual(status, 200,
+            f"/api/classify-filtered-history returned {status} – endpoint missing or not deployed")
+
+    def test_endpoint_returns_list(self):
+        status, data = self._get('/api/classify-filtered-history')
+        if status != 200:
+            self.skipTest(f"Endpoint returned {status}")
+        self.assertIsInstance(data, list,
+            f"Expected list, got {type(data)}")
+
+    def test_endpoint_data_matches_file(self):
+        """The endpoint must return as many records as the JSON file on disk holds."""
+        fpath = INSTALL_PKG / 'classify_filtered_history.json'
+        if not fpath.exists():
+            self.skipTest("classify_filtered_history.json not found")
+        with open(fpath) as f:
+            file_records = json.load(f)
+
+        status, http_records = self._get('/api/classify-filtered-history')
+        if status != 200:
+            self.skipTest(f"Endpoint returned {status}")
+
+        self.assertEqual(len(file_records), len(http_records),
+            f"File has {len(file_records)} records but endpoint returned {len(http_records)}")
+
+    def test_api_data_merges_filtered(self):
+        """fetchData() merges clip_classifications + filtered; verify /api/data exists."""
+        status, data = self._get('/api/data')
+        if status != 200:
+            self.skipTest("/api/data not reachable")
+        self.assertIn('clip_classifications', data,
+            "clip_classifications key missing from /api/data")
+
+    def test_clip_verdict_endpoint_accessible(self):
+        """POST /api/clip-verdict must return 4xx for bad payload, not 404."""
+        try:
+            req = urllib.request.Request(
+                DASHBOARD_URL + '/api/clip-verdict', data=b'{}',
+                headers={'Content-Type': 'application/json'}, method='POST',
+            )
+            with urllib.request.urlopen(req, timeout=5) as r:
+                status = r.status
+        except urllib.error.HTTPError as e:
+            status = e.code
+        except OSError as e:  # connection/timeout only; other errors should surface
+            self.skipTest(f"Dashboard not reachable ({e})")
+
+        self.assertNotEqual(status, 404,
+            "/api/clip-verdict returned 404 – endpoint not deployed in running process")
+        self.assertIn(status, (200, 400),
+            f"Unexpected status {status} for /api/clip-verdict")
+
+
+if __name__ == '__main__':
+    # Print the banner, then hand control to unittest's command-line runner.
+    rule = "=" * 60
+    print(rule, "CLIP Filtered Dashboard – Path & Endpoint Tests", rule, sep="\n")
+    unittest.main(verbosity=2)