Add visualization

luxonis · sokovninn · Nov 12, 2024 · Apr 29, 2024 · Apr 29, 2024 · May 8, 2024
commit 454d749a1496ac782cda2473a9c226387ad36ba2
diff --git a/datadreamer/pipelines/generate_dataset_from_scratch.py b/datadreamer/pipelines/generate_dataset_from_scratch.py
@@ -651,16 +651,13 @@ def read_image_batch(image_batch, batch_num, batch_size):
                     box = boxes_batch[j][k]
                     score = scores_batch[j][k]
                     label = local_labels_batch[j][k]
+
                     if args.task == "instance-segmentation":
                         if k < len(masks_batch[j]):
                             mask = masks_batch[j][k]
-                            # Unzip the list of points into separate x and y lists
                             x_points, y_points = zip(*mask)
 
-                            # Fill the polygon defined by the points to create the mask
-                            ax.fill(
-                                x_points, y_points, "blue", alpha=0.5
-                            )  # 'blue' for mask color and alpha for transparency
+                            ax.fill(x_points, y_points, "blue", alpha=0.5)
 
                     labels.append(label)
                     x1, y1, x2, y2 = box

diff --git a/datadreamer/utils/coco_converter.py b/datadreamer/utils/coco_converter.py
@@ -128,6 +128,7 @@ def process_data(
                 ):
                     bbox = [box[0], box[1], box[2] - box[0], box[3] - box[1]]
                     segmentation = (
+                        # (np.array(mask)*np.array([image_width, image_height])).reshape(-1).tolist()
                         np.array(mask).reshape(-1).tolist()
                         if mask is not None
                         else None

diff --git a/datadreamer/utils/luxonis_dataset_converter.py b/datadreamer/utils/luxonis_dataset_converter.py
@@ -86,16 +86,19 @@ def dataset_generator():
                     }
 
                 if "masks" in data[image_path]:  # polyline format
-                    poly = []
                     masks = data[image_path]["masks"]
-                    for m in masks:
-                        poly = [[point[0] / width, point[1] / height] for point in m]
+                    for mask, label in zip(masks, labels):
+                        poly = []
+                        for m in mask:
+                            poly += [
+                                (point[0] / width, point[1] / height) for point in m
+                            ]
                         yield {
                             "file": image_full_path,
                             "annotation": {
                                 "type": "polyline",
                                 "class": class_names[label],
-                                "points": poly,
+                                "points": poly,  # masks,
                             },
                         }
 

diff --git a/datadreamer/utils/yolo_converter.py b/datadreamer/utils/yolo_converter.py
@@ -4,6 +4,7 @@
 import shutil
 from typing import Dict, List
 
+import numpy as np
 from PIL import Image
 
 from datadreamer.utils import BaseConverter
@@ -76,24 +77,26 @@ def convert_to_yolo_format(
         return [x_center, y_center, width, height]
 
     def convert_masks_to_yolo_format(
-        self, masks: List[List[float]], image_width: int, image_height: int
+        self, masks: List[List[float]], w: int, h: int
     ) -> List[float]:
         """Converts masks to YOLO format.
 
         Args:
             masks (list of list of float): A list containing the masks.
-            image_width (int): The width of the image.
-            image_height (int): The height of the image.
+            w (int): The width of the image.
+            h (int): The height of the image.
 
         Returns:
             list of float: A list containing the masks in YOLO format.
         """
-        yolo_masks = []
-        for mask in masks:
-            x, y = mask[0], mask[1]
-            yolo_masks.append(x / image_width)
-            yolo_masks.append(y / image_height)
-        return yolo_masks
+        # yolo_masks = []
+        # for mask in masks:
+        #     x, y = mask[0], mask[1]
+        #     yolo_masks.append(x / image_width)
+        #     yolo_masks.append(y / image_height)
+        # return yolo_masks
+        return (np.array(masks) / np.array([w, h])).reshape(-1).tolist()
+        # return np.array(masks).reshape(-1).tolist()
 
     def process_data(
         self,

diff --git a/examples/generate_instance_segmentation_dataset_and_train_yolo.ipynb b/examples/generate_instance_segmentation_dataset_and_train_yolo.ipynb
@@ -270,6 +270,9 @@
    },
    "outputs": [],
    "source": [
+    "import os\n",
+    "os.environ['WANDB_DISABLED'] = 'true'\n",
+    "\n",
     "results = model.train(data=\"generated_dataset_yolo/data.yaml\", epochs=50)"
    ]
   },

diff --git a/examples/visualize_detection_dataset.py b/examples/visualize_detection_dataset.py
@@ -3,9 +3,10 @@
 import os
 
 import cv2
+import numpy as np
 
 
-def draw_rounded_rectangle(img, pt1, pt2, color, thickness, r, d):
+def draw_rounded_rectangle(img, pt1, pt2, color, thickness, r, masks=None):
     x1, y1 = pt1
     x2, y2 = pt2
 
@@ -24,6 +25,13 @@ def draw_rounded_rectangle(img, pt1, pt2, color, thickness, r, d):
     cv2.ellipse(img, (x2 - r, y2 - r), (r, r), 0, 0, 90, color, thickness)
 
 
+def draw_mask(image, mask, color, alpha=0.5):
+    overlay = image.copy()
+    mask = np.array([[int(p[0]), int(p[1])] for p in mask])
+    cv2.fillPoly(overlay, [mask], color)
+    cv2.addWeighted(overlay, alpha, image, 1 - alpha, 0, image)
+
+
 def draw_bboxes_and_labels(image, annotations, class_names):
     font = cv2.FONT_HERSHEY_SIMPLEX
     font_scale = 1.5  # Increased font size
@@ -32,7 +40,10 @@ def draw_bboxes_and_labels(image, annotations, class_names):
     text_color = (255, 255, 255)  # White text
     rectangle_radius = 8
 
-    for bbox, label in zip(annotations["boxes"], annotations["labels"]):
+    for i in range(len(annotations["boxes"])):
+        bbox = annotations["boxes"][i]
+        label = annotations["labels"][i]
+
         x_min, y_min, x_max, y_max = map(int, bbox)
         label_text = class_names[label]
 
@@ -54,6 +65,10 @@ def draw_bboxes_and_labels(image, annotations, class_names):
             1,
         )
 
+        if "masks" in annotations:
+            masks = annotations["masks"][i]
+            draw_mask(image, masks, (0, 255, 0), 0.5)
+
         # Draw text background
         draw_rounded_rectangle(
             image,
@@ -89,7 +104,7 @@ def visualize_dataset(dataset_dir, save_images):
 
     for image_name, annotations in all_annotations.items():
         image_path = image_name
-        image = cv2.imread(image_path)
+        image = cv2.imread(os.path.join(dataset_dir, image_path))
         image = draw_bboxes_and_labels(image, annotations, class_names)
 
         if save_images: