
Commit 21807bc

yolov8 instance segmentation and keypoints and more tests
1 parent b144881 commit 21807bc

File tree

8 files changed: 594 additions & 78 deletions


luxonis_ml/data/datasets/luxonis_dataset.py

Lines changed: 8 additions & 5 deletions
@@ -31,6 +31,8 @@
     YoloV4Exporter,
     YoloV6Exporter,
     YoloV8Exporter,
+    YoloV8InstanceSegmentationExporter,
+    YoloV8KeypointsExporter,
 )
 from luxonis_ml.data.exporters.exporter_utils import (
     ExporterSpec,
@@ -1528,11 +1530,12 @@ def export(
                 "skeletons": getattr(self.metadata, "skeletons", None),
             },
         ),
-        DatasetType.YOLOV8: ExporterSpec(
-            YoloV8Exporter,
-            {
-                "skeletons": getattr(self.metadata, "skeletons", None),
-            },
+        DatasetType.YOLOV8: ExporterSpec(YoloV8Exporter, {}),
+        DatasetType.YOLOV8INSTANCESEGMENTATION: ExporterSpec(
+            YoloV8InstanceSegmentationExporter, {}
+        ),
+        DatasetType.YOLOV8KEYPOINTS: ExporterSpec(
+            YoloV8KeypointsExporter, {}
         ),
         DatasetType.YOLOV6: ExporterSpec(YoloV6Exporter, {}),
         DatasetType.YOLOV4: ExporterSpec(YoloV4Exporter, {}),
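These registry entries make the new exporters reachable through the same export() path as the existing YOLO formats. A minimal usage sketch, assuming hypothetical import paths and an export() signature that takes an output path and a DatasetType (neither is confirmed by this diff):

# Hypothetical usage; import paths and export() parameters are assumptions.
from luxonis_ml.data import LuxonisDataset
from luxonis_ml.enums import DatasetType

dataset = LuxonisDataset("my_dataset")  # hypothetical dataset name
# The registry routes this to YoloV8InstanceSegmentationExporter:
dataset.export("exports/", dataset_type=DatasetType.YOLOV8INSTANCESEGMENTATION)
# ...and this to YoloV8KeypointsExporter:
dataset.export("exports/", dataset_type=DatasetType.YOLOV8KEYPOINTS)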

luxonis_ml/data/exporters/__init__.py

Lines changed: 6 additions & 0 deletions
@@ -13,6 +13,10 @@
 from .yolov4_exporter import YoloV4Exporter
 from .yolov6_exporter import YoloV6Exporter
 from .yolov8_exporter import YoloV8Exporter
+from .yolov8_instance_segmentation_exporter import (
+    YoloV8InstanceSegmentationExporter,
+)
+from .yolov8_keypoints_exporter import YoloV8KeypointsExporter
 
 __all__ = [
     "BaseExporter",
@@ -28,4 +32,6 @@
     "YoloV4Exporter",
     "YoloV6Exporter",
     "YoloV8Exporter",
+    "YoloV8InstanceSegmentationExporter",
+    "YoloV8KeypointsExporter",
 ]

luxonis_ml/data/exporters/exporter_utils.py

Lines changed: 39 additions & 59 deletions
@@ -7,7 +7,7 @@
 import numpy as np
 import polars as pl
 from loguru import logger
-from pycocotools import mask
+from pycocotools import mask as maskUtils
 
 if TYPE_CHECKING:
     from luxonis_ml.data.datasets.luxonis_dataset import LuxonisDataset
@@ -181,55 +181,6 @@ def get_single_skeleton(
         skeleton_1_based = [[a + 1, b + 1] for a, b in edges]
         return labels, skeleton_1_based
 
-    @staticmethod
-    def rle_to_yolo_polygon(rle: str, height: int, width: int) -> list:
-        # Decode RLE to binary mask
-        m = mask.decode({"size": [height, width], "counts": rle})
-
-        # Each contour = one polygon
-        contours, _ = cv2.findContours(
-            m, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
-        )
-
-        polygons = []
-        for contour in contours:
-            contour = contour.squeeze()
-            if len(contour.shape) != 2:
-                continue
-            polygon = []
-            for x, y in contour:
-                polygon.extend([x / width, y / height])
-            polygons.append(polygon)
-
-        return polygons
-
-    @staticmethod
-    def _bbox_from_poly(
-        coords: list[float],
-    ) -> tuple[float, float, float, float]:
-        xs = coords[0::2]
-        ys = coords[1::2]
-        x_min, x_max = min(xs), max(xs)
-        y_min, y_max = min(ys), max(ys)
-        return x_min, y_min, (x_max - x_min), (y_max - y_min)
-
-    @staticmethod
-    def _iou_xywh(
-        a: tuple[float, float, float, float],
-        b: tuple[float, float, float, float],
-    ) -> float:
-        ax, ay, aw, ah = a
-        bx, by, bw, bh = b
-        ax2, ay2 = ax + aw, ay + ah
-        bx2, by2 = bx + bw, by + bh
-        inter_w = max(0.0, min(ax2, bx2) - max(ax, bx))
-        inter_h = max(0.0, min(ay2, by2) - max(ay, by))
-        inter = inter_w * inter_h
-        if inter <= 0.0:
-            return 0.0
-        union = aw * ah + bw * bh - inter
-        return inter / union if union > 0.0 else 0.0
-
     @staticmethod
     def decode_rle_with_pycoco(ann: dict[str, Any]) -> np.ndarray:
         h = int(ann["height"])
@@ -239,14 +190,43 @@ def decode_rle_with_pycoco(ann: dict[str, Any]) -> np.ndarray:
         # pycocotools expects an RLE object with 'size' and 'counts'
         rle = {"size": [h, w], "counts": counts.encode("utf-8")}
 
-        m = mask.decode(rle)  # type: ignore[arg-type]
+        m = maskUtils.decode(rle)  # type: ignore[arg-type]
         return np.array(m, dtype=np.uint8, order="C")
 
-    def _normalize(
-        self, xs: list[float], ys: list[float], w: float, h: float
-    ) -> list[float]:
-        out: list[float] = []
-        for x, y in zip(xs, ys, strict=True):
-            out.append(max(0.0, min(1.0, x / w)))
-            out.append(max(0.0, min(1.0, y / h)))
-        return out
+    @staticmethod
+    def annotation_to_polygons(
+        ann: dict[str, Any], file_path: Path
+    ) -> list[list[tuple[float, float]]]:
+        polygons: list[list[tuple[float, float]]] = []
+
+        # COCO RLE -> decode to mask -> contours -> polygons
+        if "counts" in ann:
+            H = int(ann["height"])
+            W = int(ann["width"])
+            rle = {"size": [H, W], "counts": ann["counts"]}
+            try:
+                mask = maskUtils.decode(rle)  # type: ignore
+                if mask.ndim == 3:
+                    mask = mask[:, :, 0]
+                mask = (mask > 0).astype(np.uint8)
+
+                contours, _ = cv2.findContours(
+                    mask, cv2.RETR_EXTERNAL, cv2.CHAIN_APPROX_SIMPLE
+                )
+                for cnt in contours:
+                    if len(cnt) < 3:
+                        continue
+                    cnt = cnt.squeeze(1)
+                    poly = [
+                        (float(x) / W, float(y) / H) for x, y in cnt.tolist()
+                    ]
+                    if len(poly) >= 3:
+                        polygons.append(poly)
+            except Exception:
+                logger.warning(
+                    "Failed to decode COCO RLE; skipping this instance."
+                )
+            return polygons
+
+        return polygons
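annotation_to_polygons consolidates the removed rle_to_yolo_polygon and _normalize helpers into a single RLE -> binary mask -> contours -> normalized polygons path; it drops degenerate contours with fewer than three points and leaves clamping to the exporter. A minimal round-trip sketch under the module layout in this commit, with a toy mask standing in for a real stored annotation:

# Sketch: encode a toy mask to COCO RLE, then recover normalized polygons.
from pathlib import Path

import numpy as np
from pycocotools import mask as maskUtils

from luxonis_ml.data.exporters.exporter_utils import ExporterUtils

m = np.zeros((16, 16), dtype=np.uint8, order="F")  # pycocotools expects Fortran order
m[4:12, 4:12] = 1  # an 8x8 square
rle = maskUtils.encode(m)

ann = {"height": 16, "width": 16, "counts": rle["counts"]}
# file_path is unused on the RLE branch; any placeholder path satisfies it.
polygons = ExporterUtils.annotation_to_polygons(ann, Path("unused.png"))
# polygons holds lists of (x, y) tuples normalized to [0, 1] by width/height.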

luxonis_ml/data/exporters/yolov8_exporter.py

Lines changed: 0 additions & 6 deletions
@@ -17,21 +17,16 @@ def __init__(
         dataset_identifier: str,
         output_path: Path,
         max_partition_size_gb: float | None,
-        *,
-        skeletons: dict[str, Any] | None = None,
     ):
         super().__init__(
            dataset_identifier, output_path, max_partition_size_gb
         )
         self.class_to_id: dict[str, int] = {}
         self.class_names: list[str] = []
-        self.skeletons = skeletons  # for later keypoint export implementation
 
-    # v8 uses "val"
     def get_split_names(self) -> dict[str, str]:
         return {"train": "train", "val": "val", "test": "test"}
 
-    # v8 dataset.yaml
     def _yaml_filename(self) -> str:
         return "dataset.yaml"
 
@@ -44,7 +39,6 @@ def transform(self, prepared_ldf: PreparedLDF) -> None:
             prepared_ldf, self.supported_ann_types()
         )
 
-        # dict[split][image_name] -> list of tuples: (cid, ...) bbox or polygon
         annotation_splits: dict[str, dict[str, list[tuple]]] = {
             k: {} for k in self.get_split_names().values()
         }
luxonis_ml/data/exporters/yolov8_instance_segmentation_exporter.py

Lines changed: 186 additions & 0 deletions
@@ -0,0 +1,186 @@
+from __future__ import annotations
+
+import json
+from pathlib import Path
+from typing import Any, cast
+
+from luxonis_ml.data.exporters.exporter_utils import ExporterUtils, PreparedLDF
+
+from .base_exporter import BaseExporter
+
+
+class YoloV8InstanceSegmentationExporter(BaseExporter):
+    def __init__(
+        self,
+        dataset_identifier: str,
+        output_path: Path,
+        max_partition_size_gb: float | None,
+    ):
+        super().__init__(
+            dataset_identifier, output_path, max_partition_size_gb
+        )
+        self.class_to_id: dict[str, int] = {}
+        self.class_names: list[str] = []
+
+    def get_split_names(self) -> dict[str, str]:
+        return {"train": "train", "val": "val", "test": "test"}
+
+    def _yaml_filename(self) -> str:
+        return "dataset.yaml"
+
+    def supported_ann_types(self) -> list[str]:
+        return ["instance_segmentation"]
+
+    def transform(self, prepared_ldf: PreparedLDF) -> None:
+        ExporterUtils.check_group_file_correspondence(prepared_ldf)
+        ExporterUtils.exporter_specific_annotation_warning(
+            prepared_ldf, self.supported_ann_types()
+        )
+
+        annotation_splits: dict[str, dict[str, list[str]]] = {
+            k: {} for k in self.get_split_names().values()
+        }
+
+        df = prepared_ldf.processed_df
+        grouped = df.group_by(["file", "group_id"], maintain_order=True)
+        copied_files: set[Path] = set()
+
+        for key, group_df in grouped:
+            file_name, group_id = cast(tuple[str, Any], key)
+            logical_split = ExporterUtils.split_of_group(
+                prepared_ldf, group_id
+            )
+            split = self.get_split_names()[logical_split]
+
+            file_path = Path(str(file_name))
+            idx = self.image_indices.setdefault(
+                file_path, len(self.image_indices)
+            )
+            new_name = f"{idx}{file_path.suffix}"
+
+            label_lines: list[str] = []
+
+            for row in group_df.iter_rows(named=True):
+                ttype = row["task_type"]
+                ann_str = row["annotation"]
+                cname = row["class_name"]
+
+                if ann_str is None:
+                    continue
+                if ttype != "instance_segmentation":
+                    continue
+
+                if cname and cname not in self.class_to_id:
+                    self.class_to_id[cname] = len(self.class_to_id)
+                    self.class_names.append(cname)
+                if not cname or cname not in self.class_to_id:
+                    continue
+
+                ann = json.loads(ann_str)
+
+                cid = self.class_to_id[cname]
+                polygons = ExporterUtils.annotation_to_polygons(ann, file_path)
+
+                for poly in polygons:
+                    if len(poly) < 3:
+                        continue
+                    parts = []
+                    for x, y in poly:
+                        x_ = 0.0 if x < 0 else 1.0 if x > 1 else x
+                        y_ = 0.0 if y < 0 else 1.0 if y > 1 else y
+                        parts.append(f"{x_:.12f} {y_:.12f}")
+                    line = f"{cid} " + " ".join(parts)
+                    label_lines.append(line)
+
+            annotation_splits[split][new_name] = label_lines
+
+            ann_size_estimate = sum(len(s) + 1 for s in label_lines)
+            img_size = file_path.stat().st_size
+            annotation_splits = self._maybe_roll_partition(
+                annotation_splits, ann_size_estimate + img_size
+            )
+
+            data_path = self._get_data_path(self.output_path, split, self.part)
+            data_path.mkdir(parents=True, exist_ok=True)
+            dest = data_path / new_name
+            if file_path not in copied_files:
+                copied_files.add(file_path)
+                if dest != file_path:
+                    dest.write_bytes(file_path.read_bytes())
+                self.current_size += img_size
+
+        self._dump_annotations(annotation_splits, self.output_path, self.part)
+
+    def _maybe_roll_partition(
+        self,
+        annotation_splits: dict[str, dict[str, list[str]]],
+        additional_size: int,
+    ) -> dict[str, dict[str, list[str]]]:
+        if (
+            self.max_partition_size
+            and self.part is not None
+            and (self.current_size + additional_size) > self.max_partition_size
+        ):
+            self._dump_annotations(
+                annotation_splits, self.output_path, self.part
+            )
+            self.current_size = 0
+            self.part += 1
+            return {k: {} for k in self.get_split_names().values()}
+        return annotation_splits
+
+    def _dump_annotations(
+        self,
+        annotation_splits: dict[str, dict[str, list[str]]],
+        output_path: Path,
+        part: int | None = None,
+    ) -> None:
+        base = (
+            output_path / f"{self.dataset_identifier}_part{part}"
+            if part is not None
+            else output_path / self.dataset_identifier
+        )
+
+        for split_name in self.get_split_names().values():
+            labels_dir = base / "labels" / split_name
+            labels_dir.mkdir(parents=True, exist_ok=True)
+            images_dir = base / "images" / split_name
+            images_dir.mkdir(parents=True, exist_ok=True)
+
+            for img_name, lines in annotation_splits.get(
+                split_name, {}
+            ).items():
+                (labels_dir / f"{Path(img_name).stem}.txt").write_text(
+                    "\n".join(lines), encoding="utf-8"
+                )
+
+        yaml_filename = self._yaml_filename()
+        if yaml_filename:
+            split_dirs = self.get_split_names()
+            yaml_obj = {
+                "train": str(Path("images") / split_dirs["train"]),
+                "val": str(Path("images") / split_dirs["val"]),
+                "test": str(Path("images") / split_dirs["test"]),
+                "nc": len(self.class_names),
+                "names": self.class_names,
+            }
+            (base / yaml_filename).write_text(
+                self._to_yaml(yaml_obj), encoding="utf-8"
+            )
+
+    def _get_data_path(
+        self, output_path: Path, split: str, part: int | None = None
+    ) -> Path:
+        base = (
+            output_path / f"{self.dataset_identifier}_part{part}"
+            if part is not None
+            else output_path / self.dataset_identifier
+        )
+        return base / "images" / split
+
+    @staticmethod
+    def _to_yaml(d: dict[str, Any]) -> str:
+        lines: list[str] = []
+        for k, v in d.items():
+            lines.append(f"{k}: {v}")
+        return "\n".join(lines) + "\n"
