vortexntnu
diff --git a/‎ros/yolo_obb_object_detection/config/yolo_obb_object_detection_params.yaml‎
Lines changed: 4 additions & 4 deletions b/‎ros/yolo_obb_object_detection/config/yolo_obb_object_detection_params.yaml‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎ros/yolo_obb_object_detection/setup.py‎
Lines changed: 0 additions & 1 deletion b/‎ros/yolo_obb_object_detection/setup.py‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎ros/yolo_object_detection/config/yolo_object_detection_params.yaml‎
Lines changed: 3 additions & 3 deletions b/‎ros/yolo_object_detection/config/yolo_object_detection_params.yaml‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎ros/yolo_object_detection/setup.py‎
Lines changed: 0 additions & 1 deletion b/‎ros/yolo_object_detection/setup.py‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎ros/yolo_segmentation/config/yolo_segmentation_params.yaml‎
Lines changed: 4 additions & 4 deletions b/‎ros/yolo_segmentation/config/yolo_segmentation_params.yaml‎
Lines changed: 4 additions & 4 deletions
diff --git a/‎ros/yolo_segmentation/setup.py‎
Lines changed: 0 additions & 1 deletion b/‎ros/yolo_segmentation/setup.py‎
Lines changed: 0 additions & 1 deletion
diff --git a/‎stonefish_labeling/camera_segmentation/config/camera_segmentation_params.yaml‎
Lines changed: 3 additions & 3 deletions b/‎stonefish_labeling/camera_segmentation/config/camera_segmentation_params.yaml‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎stonefish_labeling/dataset_conversion_scripts/convert_to_yolo.py‎
Lines changed: 10 additions & 2 deletions b/‎stonefish_labeling/dataset_conversion_scripts/convert_to_yolo.py‎
Lines changed: 10 additions & 2 deletions
diff --git a/‎stonefish_labeling/dataset_conversion_scripts/convert_to_yolo_obb.py‎
Lines changed: 241 additions & 0 deletions b/‎stonefish_labeling/dataset_conversion_scripts/convert_to_yolo_obb.py‎
Lines changed: 241 additions & 0 deletions
diff --git a/‎stonefish_labeling/valve_randomizer/launch/valve_randomizer.launch.py‎
Lines changed: 28 additions & 0 deletions b/‎stonefish_labeling/valve_randomizer/launch/valve_randomizer.launch.py‎
Lines changed: 28 additions & 0 deletions
@@ -1,8 +1,8 @@
 /**:
   ros__parameters:
-    model_path: 'obb_best.pt'
-    confidence_threshold: 0.1
-    input_topic: '/realsense/D555_409122300281_Color'
+    model_path: 'best.pt'
+    confidence_threshold: 0.01
+    input_topic: '/camera/camera/color/image_raw'
     output_detections_topic: '/yolo_obb_object_detection/detections'
     output_annotated_topic: '/yolo_obb_object_detection/annotated'
-    device: 'cpu' # Inference device: 'cpu', 0, 1, 'cuda', 'cuda:0', or 'mps' (Mac GPU)
+    device: '0' # Inference device: 'cpu', 0, 1, 'cuda', 'cuda:0', or 'mps' (Mac GPU)
@@ -24,7 +24,6 @@
     maintainer_email='89779148+kluge7@users.noreply.github.com',
     description='YOLO OBB object detection on images, publishing detections and annotated outputs.',
     license='MIT',
-    tests_require=['pytest'],
     entry_points={
         'console_scripts': [
             'yolo_obb_object_detection_node=yolo_obb_object_detection.yolo_obb_object_detection_node:main',
 
@@ -1,8 +1,8 @@
 /**:
   ros__parameters:
-    model_path: 'best.pt'
-    confidence_threshold: 0.1
+    model_path: 'best_simulator.pt'
+    confidence_threshold: 0.5
     input_topic: '/nautilus/front_camera/image_color'
     output_detections_topic: '/yolo_object_detection/detections'
     output_annotated_topic: '/yolo_object_detection/annotated'
-    device: 'cpu' # or '0' for GPU
+    device: '0' # GPU index 0; use 'cpu' for CPU inference
@@ -24,7 +24,6 @@
     maintainer_email='89779148+kluge7@users.noreply.github.com',
     description='YOLO object detection on images, publishing detections and annotated outputs.',
     license='MIT',
-    tests_require=['pytest'],
     entry_points={
         'console_scripts': [
             'yolo_object_detection_node=yolo_object_detection.yolo_object_detection_node:main',
 
@@ -1,7 +1,7 @@
 yolo_segmentation_node:
   ros__parameters:
     # Node parameters
-    input_topic: "/nautilus/down_camera/image_color"
+    input_topic: "/camera/camera/color/image_raw"
     output_bbox_topic: "/pipeline/camera/bboxes"
     output_mask_topic: "/pipeline/camera/segmentation_mask"
     output_debug_topic: "/pipeline/camera/segmentation_debug"
@@ -10,11 +10,11 @@ yolo_segmentation_node:
     pub_debug: True
 
     # Camera info parameters
-    input_camera_info_topic: "/nautilus/down_camera/camera_info"
-    output_camera_info_topic: "/pipeline/camera/camera_info"  # Scaled to match segmentation mask resolution
+    input_camera_info_topic: "/camera/camera/color/camera_info"
+    output_camera_info_topic: "/pipeline/camera/camera_info" # Scaled to match segmentation mask resolution
 
     # Implementation parameters
-    model_path: "yolo26l_sim_and_real.pt"
+    model_path: "mclab-seg-pipe-overfit-hopefully-large-model.pt"
     device: "cuda" # Options: "cpu", "cuda", "cuda:0", "cuda:1", "mps" ++
 
     # Image preprocessing (what ultralytics does):
 
@@ -21,7 +21,6 @@
     maintainer_email='mjengesv@ntnu.no',
     description='ROS 2 package that provides a YOLO-based instance segmentation node (yolo_seg_node) for real-time segmentation.',
     license='MIT',
-    tests_require=['pytest'],
     entry_points={
         'console_scripts': [
             'yolo_seg_node = yolo_segmentation.yolo_seg_node:main',
 
@@ -1,7 +1,7 @@
 /**:
   ros__parameters:
-    segmentation_image_sub_topic: "/front_camera_seg/image_color"
-    color_image_sub_topic:    "/front_camera/image_color"
-    output_dir: /home/jorgen/ros2_ws/src/vortex-deep-learning-pipelines/stonefish_labeling/camera_segmentation/resources
+    segmentation_image_sub_topic: "/nautilus/segmentation_cam/image_color"
+    color_image_sub_topic:    "/nautilus/front_camera/image_color"
+    output_dir: /home/vortex/stonefish_labeling_output_new_new_new
     sync_tolerance_ms: 100 # Timestamps of the two topics from stonefish are not perfectly synced.
                           # This sets the max allowed time offset between the two topics.
@@ -124,7 +124,11 @@ def main():
     if not mask_files:
         mask_files = sorted(seg_dir.glob("*_ids.tiff"))
 
-    for mf in mask_files:
+    total_masks = len(mask_files)
+    print(f"[1/2] Scanning {total_masks} masks to discover class ids...")
+    for i, mf in enumerate(mask_files, 1):
+        if i % 50 == 0 or i == total_masks:
+            print(f"  scanned {i}/{total_masks}")
         ids_raw = cv2.imread(str(mf), cv2.IMREAD_UNCHANGED)
         if ids_raw is None:
             continue
@@ -156,7 +160,11 @@ def main():
     if not front_files:
         front_files = sorted(seg_dir.glob("*.png"))
 
-    for cpath in front_files:
+    total_frames = len(front_files)
+    print(f"[2/2] Converting {total_frames} frames to YOLO labels...")
+    for i, cpath in enumerate(front_files, 1):
+        if i % 50 == 0 or i == total_frames:
+            print(f"  converted {i}/{total_frames}")
         img = cv2.imread(str(cpath), cv2.IMREAD_COLOR)
         stem = cpath.stem
         mask_tiff = seg_dir / f"{stem}_mask.tiff"
 
@@ -0,0 +1,241 @@
+#!/usr/bin/env python3
+import argparse
+import json
+import logging
+import os
+import shutil
+from pathlib import Path
+
+import cv2
+import numpy as np
+import pandas as pd
+
+
+def load_id_to_label(seg_dir: Path) -> dict:
+    """Load the mapping from segmentation id to class label.
+
+    Sources are tried in order and the first file that exists wins:
+
+    1. ``id_label_map.json`` -- a JSON object of ``{id: label}``.
+    2. ``id_label_map.csv`` -- a CSV with ``id`` and ``label`` columns.
+    3. ``legend.csv`` -- only its ``id`` column is used and labels are
+       synthesized: ``background`` for 0, ``unknown`` for 65534 and
+       ``id_<n>`` for everything else.
+
+    Args:
+        seg_dir: Directory that holds the mapping/legend files.
+
+    Returns:
+        Dict mapping ``int`` ids to ``str`` labels. Empty when none of the
+        files exist.
+    """
+    json_path = seg_dir / "id_label_map.json"
+    if json_path.exists():
+        raw = json.loads(json_path.read_text(encoding="utf-8"))
+        return {int(k): str(v) for k, v in raw.items()}
+
+    csv_path = seg_dir / "id_label_map.csv"
+    if csv_path.exists():
+        records = pd.read_csv(csv_path).to_dict("records")
+        return {int(r["id"]): str(r["label"]) for r in records}
+
+    legend = seg_dir / "legend.csv"
+    if not legend.exists():
+        return {}
+
+    reserved = {0: "background", 65534: "unknown"}
+    mapping = {}
+    for raw_id in pd.read_csv(legend)["id"].tolist():
+        # Normalize to int like the JSON/CSV branches do; a float-typed
+        # column would otherwise produce labels such as "id_7.0".
+        try:
+            obj_id = int(raw_id)
+        except (TypeError, ValueError, OverflowError):
+            # Missing/non-numeric id cell: nothing sensible to map.
+            continue
+        mapping[obj_id] = reserved.get(obj_id, f"id_{obj_id}")
+    return mapping
+
+
+def load_legend_colors(seg_dir: Path) -> dict:
+    """Read ``legend.csv`` and return the color assigned to each id.
+
+    Rows whose ``id``, ``r``, ``g`` or ``b`` cell is missing or cannot be
+    converted to ``int`` are skipped (and reported at debug level) instead
+    of aborting the whole load.
+
+    Args:
+        seg_dir: Directory expected to contain ``legend.csv``.
+
+    Returns:
+        Dict mapping ``int`` id to an ``(r, g, b)`` tuple of ints. Empty
+        when the legend file does not exist.
+    """
+    legend_path = seg_dir / "legend.csv"
+    if not legend_path.exists():
+        return {}
+
+    colors = {}
+    for row in pd.read_csv(legend_path).to_dict("records"):
+        try:
+            colors[int(row["id"])] = (
+                int(row["r"]),
+                int(row["g"]),
+                int(row["b"]),
+            )
+        except (KeyError, TypeError, ValueError, OverflowError) as e:
+            # Only the failures a malformed row can cause are tolerated;
+            # anything else is a genuine bug and should propagate.
+            logging.debug("Skipping legend row due to error: %s", e)
+    return colors
+
+
+def convert_mask_image_to_ids(ids_img: np.ndarray, legend_colors: dict) -> np.ndarray:
+    """Turn a mask image into a 2-D ``int32`` array of object ids.
+
+    A 2-D input is taken to already hold ids and is only cast to ``int32``.
+    For a multi-channel input, the first three channels of every pixel are
+    packed into one integer (channel 0 in the low byte) and looked up in
+    ``legend_colors``; pixels whose color is not in the legend get 65534.
+
+    Args:
+        ids_img: Mask image as read from disk, or ``None``.
+        legend_colors: Dict mapping id to an ``(r, g, b)`` tuple.
+
+    Returns:
+        ``(height, width)`` ``int32`` array of ids, or ``None`` when
+        ``ids_img`` is ``None``.
+    """
+    if ids_img is None:
+        return None
+    if ids_img.ndim == 2:
+        return ids_img.astype(np.int32)
+
+    # Legend colors are (r, g, b) while pixel channel 0 is matched against
+    # b, so the packed key is b | g << 8 | r << 16.
+    packed_to_id = {
+        ((r & 0xFF) << 16) | ((g & 0xFF) << 8) | (b & 0xFF): obj_id
+        for obj_id, (r, g, b) in legend_colors.items()
+    }
+
+    height, width = ids_img.shape[0], ids_img.shape[1]
+    pixels = ids_img.reshape(-1, ids_img.shape[2])[:, :3].astype(np.uint32)
+    packed = pixels[:, 0] | (pixels[:, 1] << 8) | (pixels[:, 2] << 16)
+
+    # Start from "unknown" everywhere, then overwrite each legend color.
+    result = np.full(packed.shape, 65534, dtype=np.int32)
+    for key, obj_id in packed_to_id.items():
+        result[packed == key] = obj_id
+    return result.reshape(height, width)
+
+
+def obb_line_from_mask(
+    mask: np.ndarray, img_w: int, img_h: int, cls_idx: int, axis_aligned: bool = False
+):
+    """Return YOLO-OBB line: 'cls x1 y1 x2 y2 x3 y3 x4 y4' (normalized).
+
+    Args:
+        mask: 2-D boolean array that is True on the object's pixels.
+        img_w: Width used to normalize x coordinates.
+        img_h: Height used to normalize y coordinates.
+        cls_idx: Class index written as the first field of the line.
+        axis_aligned: When True, use the upright bounding box of the mask
+            pixels instead of ``cv2.minAreaRect``.
+
+    Returns:
+        The label line, or ``None`` when the mask has fewer than 3 pixels.
+        Every coordinate is clamped to [0, 1].
+    """
+    ys, xs = np.where(mask)
+    if ys.size < 3:
+        return None
+
+    if axis_aligned:
+        x_min, x_max = float(xs.min()), float(xs.max())
+        y_min, y_max = float(ys.min()), float(ys.max())
+        box = np.array(
+            [[x_min, y_min], [x_max, y_min], [x_max, y_max], [x_min, y_max]],
+            dtype=np.float32,
+        )
+    else:
+        pts = np.stack([xs, ys], axis=1).astype(np.float32)
+        box = cv2.boxPoints(cv2.minAreaRect(pts))
+
+    def _normalized(value, extent) -> str:
+        # Corners of a rotated rectangle can poke outside the image when the
+        # object touches the border; label loaders reject coordinates
+        # outside [0, 1], so clamp before formatting.
+        return f"{min(max(float(value) / extent, 0.0), 1.0):.6f}"
+
+    coords = []
+    for x, y in box:
+        coords.append(_normalized(x, img_w))
+        coords.append(_normalized(y, img_h))
+    return f"{cls_idx} " + " ".join(coords)
+
+
+def main():
+    """Convert a directory of frames and id masks into a YOLO-OBB dataset.
+
+    Command-line arguments:
+        --seg-dir: Input directory with frames, masks and legend files.
+        --out-dir: Output directory; ``images/``, ``labels/``,
+            ``classes.txt`` and ``data.yaml`` are written below it.
+        --min-pixels: Minimum pixel count for an id to be considered.
+        --keep-ids: Comma-separated ids to keep; empty keeps all.
+        --axis-aligned-ids: Comma-separated ids that get upright boxes.
+
+    The conversion runs in two passes: the first scans every mask to decide
+    which ids become classes, the second writes one label file per frame
+    and copies the frame into ``images/``.
+    """
+    ap = argparse.ArgumentParser()
+    ap.add_argument("--seg-dir", required=True)
+    ap.add_argument("--out-dir", required=True)
+    ap.add_argument("--min-pixels", type=int, default=200)
+    ap.add_argument(
+        "--keep-ids",
+        type=str,
+        default="",
+        help="Comma-separated list of ids to keep (e.g. '7'). Empty = keep all.",
+    )
+    ap.add_argument(
+        "--axis-aligned-ids",
+        type=str,
+        default="",
+        help="Comma-separated ids that should get axis-aligned (upright) boxes "
+        "instead of minAreaRect. Still emitted in OBB format.",
+    )
+    args = ap.parse_args()
+
+    # A value that is empty or holds only separators/whitespace means
+    # "keep all", matching the help text, rather than "keep nothing".
+    keep_ids = {int(x) for x in args.keep_ids.split(",") if x.strip()} or None
+    axis_aligned_ids = {int(x) for x in args.axis_aligned_ids.split(",") if x.strip()}
+
+    seg_dir = Path(os.path.expanduser(args.seg_dir))
+    # Expand "~" here too so both directory arguments behave the same way.
+    out_dir = Path(os.path.expanduser(args.out_dir))
+    (out_dir / "images").mkdir(parents=True, exist_ok=True)
+    (out_dir / "labels").mkdir(parents=True, exist_ok=True)
+
+    id2label = load_id_to_label(seg_dir)
+    legend_colors = load_legend_colors(seg_dir)
+
+    # ---- Pass 1: discover which ids are present often enough to be classes.
+    present_ids = set()
+    mask_files = sorted(seg_dir.glob("*_mask.*"))
+    if not mask_files:
+        mask_files = sorted(seg_dir.glob("*_ids.tiff"))
+
+    total_masks = len(mask_files)
+    print(f"[1/2] Scanning {total_masks} masks to discover class ids...")
+    for i, mf in enumerate(mask_files, 1):
+        if i % 50 == 0 or i == total_masks:
+            print(f"  scanned {i}/{total_masks}")
+        ids_raw = cv2.imread(str(mf), cv2.IMREAD_UNCHANGED)
+        if ids_raw is None:
+            continue
+        ids_map = convert_mask_image_to_ids(ids_raw, legend_colors)
+        if ids_map is None:
+            continue
+        uniq, counts = np.unique(ids_map, return_counts=True)
+        for obj_id, cnt in zip(uniq, counts):
+            obj_id = int(obj_id)
+            # 0 and 65534 are the background / unknown ids, never classes.
+            if obj_id in (0, 65534):
+                continue
+            if keep_ids is not None and obj_id not in keep_ids:
+                continue
+            if int(cnt) >= args.min_pixels:
+                present_ids.add(obj_id)
+
+    class_ids = sorted(present_ids)
+    classes = [id2label.get(obj_id, f"id_{obj_id}") for obj_id in class_ids]
+    (out_dir / "classes.txt").write_text("\n".join(classes), encoding="utf-8")
+    id2idx = {cid: i for i, cid in enumerate(class_ids)}
+
+    # ---- Pass 2: write one label file per frame and copy the frame.
+    front_files = sorted(seg_dir.glob("frame_*.png"))
+    if not front_files:
+        # The catch-all pattern also matches "<stem>_mask.png"; those are
+        # masks, not frames, so leave them out of the frame list.
+        front_files = sorted(
+            p for p in seg_dir.glob("*.png") if not p.stem.endswith("_mask")
+        )
+
+    total_frames = len(front_files)
+    print(f"[2/2] Converting {total_frames} frames to YOLO-OBB labels...")
+    for i, cpath in enumerate(front_files, 1):
+        if i % 50 == 0 or i == total_frames:
+            print(f"  converted {i}/{total_frames}")
+        img = cv2.imread(str(cpath), cv2.IMREAD_COLOR)
+        stem = cpath.stem
+
+        # Mask lookup order: <stem>_mask.tiff, <stem>_mask.png, then the
+        # legacy <stem>_ids.tiff name.
+        mask_tiff = seg_dir / f"{stem}_mask.tiff"
+        mask_png = seg_dir / f"{stem}_mask.png"
+        if mask_tiff.exists():
+            ids_raw = cv2.imread(str(mask_tiff), cv2.IMREAD_UNCHANGED)
+        elif mask_png.exists():
+            ids_raw = cv2.imread(str(mask_png), cv2.IMREAD_UNCHANGED)
+        else:
+            legacy = seg_dir / f"{stem}_ids.tiff"
+            ids_raw = (
+                cv2.imread(str(legacy), cv2.IMREAD_UNCHANGED)
+                if legacy.exists()
+                else None
+            )
+
+        if ids_raw is None or img is None:
+            print(f"WARNING: Skipping {cpath.name} (failed to read front or mask)")
+            continue
+
+        ids = convert_mask_image_to_ids(ids_raw, legend_colors)
+        if ids is None:
+            continue
+
+        h, w = ids.shape[:2]
+        uniq, counts = np.unique(ids, return_counts=True)
+
+        lines = []
+        for obj_id, count in zip(uniq, counts):
+            obj_id = int(obj_id)
+            if obj_id in (0, 65534):
+                continue
+            if count < args.min_pixels:
+                continue
+            # Ids that did not become classes in pass 1 (e.g. filtered by
+            # --keep-ids) have no class index and are dropped.
+            if obj_id not in id2idx:
+                continue
+            mask = ids == obj_id
+            line = obb_line_from_mask(
+                mask, w, h, id2idx[obj_id], axis_aligned=obj_id in axis_aligned_ids
+            )
+            if line is not None:
+                lines.append(line)
+
+        label_path = out_dir / "labels" / (stem + ".txt")
+        label_path.write_text("\n".join(lines), encoding="utf-8")
+
+        try:
+            shutil.copy2(cpath, out_dir / "images" / cpath.name)
+        except shutil.SameFileError:
+            # Source and destination are the same file: nothing to copy.
+            pass
+        except OSError as e:
+            # Still best-effort, but make the failure visible: the default
+            # logging level would hide a debug message, leaving a label
+            # file with no image and no hint why.
+            print(f"WARNING: Failed to copy image {cpath}: {e}")
+
+    yaml_lines = [
+        f"path: {out_dir.resolve()}",
+        "train: images",
+        "val: images",
+        # A JSON array is a valid YAML flow sequence and, unlike a Python
+        # list repr, escapes quotes and backslashes in labels correctly.
+        f"names: {json.dumps(classes, ensure_ascii=False)}",
+    ]
+    (out_dir / "data.yaml").write_text("\n".join(yaml_lines), encoding="utf-8")
+    print(f"Done. Exported to: {out_dir}")
+
+
+if __name__ == "__main__":
+    main()
@@ -0,0 +1,28 @@
+from launch import LaunchDescription
+from launch.actions import DeclareLaunchArgument
+from launch.substitutions import LaunchConfiguration
+from launch_ros.actions import Node
+
+
+def generate_launch_description() -> LaunchDescription:
+    """Build the launch description that starts the valve randomizer node.
+
+    Declares the ``period``, ``min_angle`` and ``max_angle`` launch
+    arguments and forwards them, together with a fixed ``valves`` list, as
+    parameters of ``valve_randomizer_node``.
+
+    Returns:
+        The ``LaunchDescription`` holding the argument declarations and
+        the node action.
+    """
+    # Local import so the rest of the module is unaffected.
+    from launch_ros.parameter_descriptions import ParameterValue
+
+    def _float_arg(name: str) -> ParameterValue:
+        # Launch arguments arrive as strings and are otherwise type-guessed,
+        # so "period:=5" would be passed on as an integer. Pin the type to
+        # float to match the float-valued defaults declared below.
+        return ParameterValue(LaunchConfiguration(name), value_type=float)
+
+    return LaunchDescription(
+        [
+            DeclareLaunchArgument(
+                "period",
+                default_value="5.0",
+                description="Value of the node's 'period' parameter.",
+            ),
+            DeclareLaunchArgument(
+                "min_angle",
+                default_value="-1.57",
+                description="Value of the node's 'min_angle' parameter.",
+            ),
+            DeclareLaunchArgument(
+                "max_angle",
+                default_value="1.57",
+                description="Value of the node's 'max_angle' parameter.",
+            ),
+            Node(
+                package="valve_randomizer",
+                executable="valve_randomizer_node",
+                name="valve_randomizer",
+                output="screen",
+                parameters=[
+                    {
+                        "valves": ["valve1", "valve2"],
+                        "period": _float_arg("period"),
+                        "min_angle": _float_arg("min_angle"),
+                        "max_angle": _float_arg("max_angle"),
+                    }
+                ],
+            ),
+        ]
+    )