Visual-Behavior · thibo73800 · Sep 9, 2021 · Sep 7, 2021 · Sep 7, 2021 · Sep 7, 2021
diff --git a/alodataset/coco_detection_dataset.py b/alodataset/coco_detection_dataset.py
@@ -3,10 +3,9 @@
 in a :mod:`Frame object <aloscene.frame>`. Ideal for object detection applications.
 """
 
-import logging
-
 import torch
 import torch.utils.data
+from pycocotools.coco import COCO
 from pycocotools import mask as coco_mask
 import numpy as np
 import os
@@ -16,7 +15,7 @@
 from torchvision.datasets.coco import CocoDetection
 
 from alodataset import BaseDataset
-from aloscene import BoundingBoxes2D, Frame, Labels
+from aloscene import BoundingBoxes2D, Frame, Labels, Mask
 
 
 class CocoDetectionSample(CocoDetection):
@@ -34,48 +33,51 @@ def __init__(
         name: str = "coco",
         return_masks=False,
         classes: list = None,
+        stuff_ann_file: str = None,
         **kwargs,
     ):
         """
-        Attributes
-        ----------
-        CATEGORIES : set
-            List of all unique tags read from the database
-        labels_names : list
-            List of labels according to their corresponding positions
-        prepare : :mod:`BaseDataset <base_dataset>`
+    Attributes
+    ----------
+    CATEGORIES : set
+        List of all unique tags read from the database
+    labels_names : list
+        List of labels according to their corresponding positions
+    prepare : :mod:`BaseDataset <base_dataset>`
 
-        Parameters
-        ----------
-        img_folder : str
-            Path to the image folder relative at `dataset_dir` (stored into the aloception config file)
-        ann_file : str
-            Path to the annotation file relative at `dataset_dir` (stored into the aloception config file)
-        name : str, optional
-            Key of database name in `alodataset_config.json` file, by default *coco*
-        return_masks : bool, optional
-            Include masks labels in the output, by default False
-        classes : list, optional
-            List of classes to be filtered in the annotation reading process, by default None
-        **kwargs : dict
-            :mod:`BaseDataset <base_dataset>` optional parameters
-
-        Raises
-        ------
-        Exception
-            If a classes list is decided, each label must be inside of :attr:`CATEGORIES` list attribute
-
-        Examples
-        --------
-            >>> coco_ds = CocoDetectionDataset(
-            ... img_folder = "val2017",
-            ... ann_file = "annotations/instances_val2017.json",
-            ... mode = "validation"
-            )
-            >>> frames = next(iter(coco_ds.train_loader()))
-            >>> frames = frames[0].batch_list(frames)
-            >>> frames.get_view(frames.boxes2d,).render()
-        """
+    Parameters
+    ----------
+    img_folder : str
+        Path to the image folder relative at `dataset_dir` (stored into the aloception config file)
+    ann_file : str
+        Path to the annotation file relative at `dataset_dir` (stored into the aloception config file)
+    name : str, optional
+        Key of database name in `alodataset_config.json` file, by default *coco*
+    return_masks : bool, optional
+        Include masks labels in the output, by default False
+    classes : list, optional
+        List of classes to be filtered in the annotation reading process, by default None
+    stuff_ann_file: str, optional
+        Additional annotations with new classes, by default None
+    **kwargs : dict
+        :mod:`BaseDataset <base_dataset>` optional parameters
+
+    Raises
+    ------
+    Exception
+        If a classes list is decided, each label must be inside of :attr:`CATEGORIES` list attribute
+
+    Examples
+    --------
+        >>> coco_ds = CocoDetectionDataset(
+        ... img_folder = "val2017",
+        ... ann_file = "annotations/instances_val2017.json",
+        ... mode = "validation"
+        )
+        >>> frames = next(iter(coco_ds.train_loader()))
+        >>> frames = frames[0].batch_list(frames)
+        >>> frames.get_view(frames.boxes2d,).render()
+    """
 
         if "sample" not in kwargs:
             kwargs["sample"] = False
@@ -88,17 +90,25 @@ def __init__(
             dataset_dir = BaseDataset.get_dataset_dir(self)
             img_folder = os.path.join(dataset_dir, img_folder)
             ann_file = os.path.join(dataset_dir, ann_file)
+            stuff_ann_file = None if stuff_ann_file is None else os.path.join(dataset_dir, stuff_ann_file)
 
         self.sample = kwargs["sample"]
         super(CocoDetectionDataset, self).__init__(name=name, root=img_folder, annFile=ann_file, **kwargs)
         if self.sample:
             return
 
         cats = self.coco.loadCats(self.coco.getCatIds())
+        self.coco_stuff = None
+        if stuff_ann_file is not None:
+            self.coco_stuff = COCO(stuff_ann_file)
+            cats += self.coco_stuff.loadCats(self.coco_stuff.getCatIds())
 
         # Setup the class names
         nb_category = max(cat["id"] for cat in cats)
         self.CATEGORIES = set([cat["name"] for cat in cats])
+        # aux = set([x.split("-")[0] for x in self.CATEGORIES])
+        # print(aux, len(aux))
+        # print(set([cat["supercategory"] for cat in cats]), len(set([cat["supercategory"] for cat in cats])))
         labels_names = ["N/A"] * (nb_category + 1)
         for cat in cats:
             labels_names[cat["id"]] = cat["name"]
@@ -129,7 +139,7 @@ def __init__(
         self.items = self.ids
 
     def getitem(self, idx):
-        """Get the :mod:`Frame <aloscene.frame>` corresponds to *idx* index
+        """ Get the :mod:`Frame <aloscene.frame>` corresponds to *idx* index
 
         Parameters
         ----------
@@ -144,7 +154,10 @@ def getitem(self, idx):
         if self.sample:
             return BaseDataset.__getitem__(self, idx)
         img, target = CocoDetectionSample.__getitem__(self, idx)
+
         image_id = self.ids[idx]
+        if self.coco_stuff is not None:
+            target += self.coco_stuff.loadAnns(self.coco_stuff.getAnnIds(image_id))
         target = {"image_id": image_id, "annotations": target}
 
         frame = Frame(np.transpose(np.array(img), [2, 0, 1]), names=("C", "H", "W"))
@@ -171,10 +184,12 @@ def getitem(self, idx):
             names=("N", None),
             labels=labels_2d,
         )
-
-        # frame.append_boxes2d(boxes.xcyc().rel_pos())
         frame.append_boxes2d(boxes)
 
+        if self.prepare.return_masks:
+            segmentation = Mask(target["masks"], names=("N", "H", "W"), labels=labels_2d)
+            frame.append_segmentation(segmentation)
+
         return frame
 
 
@@ -198,8 +213,9 @@ def __init__(self, return_masks: bool = False):
     def convert_coco_poly_to_mask(self, segmentations, height, width):
         masks = []
         for polygons in segmentations:
-            rles = coco_mask.frPyObjects(polygons, height, width)
-            mask = coco_mask.decode(rles)
+            if isinstance(polygons, list):
+                polygons = coco_mask.frPyObjects(polygons, height, width)
+            mask = coco_mask.decode(polygons)
             if len(mask.shape) < 3:
                 mask = mask[..., None]
             mask = torch.as_tensor(mask, dtype=torch.uint8)
@@ -281,15 +297,14 @@ def show_random_frame(coco_loader):
 
 def main():
     """Main"""
-    logging.basicConfig(
-        level=logging.INFO,
-        format="[%(asctime)s][%(levelname)s] %(message)s",
-        datefmt="%d-%m-%y %H:%M:%S",
-    )
-    log = logging.getLogger("aloception")
-
+    # coco_dataset = CocoDetectionDataset(
+    #     img_folder="val2017",
+    #     stuff_ann_file="annotations/stuff_val2017.json",
+    #     ann_file="annotations/instances_val2017.json",
+    #     return_masks=True,
+    # )
     coco_dataset = CocoDetectionDataset(sample=True)
-    log.info(repr(coco_dataset))
+
     for f, frames in enumerate(coco_dataset.train_loader(batch_size=2)):
         frames = Frame.batch_list(frames)
         frames.get_view().render()

diff --git a/aloscene/__init__.py b/aloscene/__init__.py
@@ -7,5 +7,5 @@
 from .oriented_boxes_2d import OrientedBoxes2D
 from .mask import Mask
 from .flow import Flow
-from .disparity import Disparity
 from .frame import Frame
+from .disparity import Disparity
diff --git a/aloscene/frame.py b/aloscene/frame.py
@@ -1,21 +1,15 @@
-from aloscene.disparity import Disparity
-from importlib.abc import ExecutionLoader
 import torch
-import torchvision.transforms.functional as F
 import torchvision
-from typing import *
-from torch import Tensor
-import numpy as np
-from collections import namedtuple
-import inspect
-import time
+from typing import TypeVar, Union
 
+# from collections import namedtuple
 
 import aloscene
-from aloscene.renderer import View, Renderer
-from aloscene import BoundingBoxes2D, Labels, Flow, Mask, Disparity
-from aloscene import BoundingBoxes2D, Labels, Flow, Mask, BoundingBoxes3D
-from aloscene.camera_calib import CameraExtrinsic, CameraIntrinsic
+from aloscene.renderer import View
+from aloscene.disparity import Disparity
+from aloscene import BoundingBoxes2D, BoundingBoxes3D, Flow, Mask
+
+# from aloscene.camera_calib import CameraExtrinsic, CameraIntrinsic
 from aloscene.io.image import load_image
 
 Frame = TypeVar("Frame")
@@ -32,6 +26,7 @@ def __new__(
         boxes3d: Union[dict, BoundingBoxes3D] = None,
         flow: Flow = None,
         mask: Mask = None,
+        segmentation: Mask = None,
         disparity: Disparity = None,
         normalization="255",
         mean_std=None,
@@ -52,6 +47,7 @@ def __new__(
         tensor.add_label("flow", flow, align_dim=["B", "T"], mergeable=False)
         tensor.add_label("mask", mask, align_dim=["B", "T"], mergeable=True)
         tensor.add_label("disparity", disparity, align_dim=["B", "T"], mergeable=True)
+        tensor.add_label("segmentation", segmentation, align_dim=["B", "T"], mergeable=False)
 
         # Add other tensor property
         tensor.add_property("normalization", normalization)
@@ -142,6 +138,20 @@ def append_disparity(self, disparity, name=None):
         """
         self._append_label("disparity", disparity, name)
 
+    def append_segmentation(self, segmentation: Mask, name: str = None):
+        """Attach a segmentation to the frame.
+
+        Parameters
+        ----------
+        segmentation: aloscene.Mask
+            Mask with size (N,H,W), where N is the features maps, each one for one object.
+            Each feature map must be a binary mask. For that, is a type of aloscene.Mask
+        name: str
+            If none, the mask will be attached without name (if possible). Otherwise if no other unnamed
+            mask are attached to the frame, the mask will be added to the set of mask.
+        """
+        self._append_label("segmentation", segmentation, name)
+
     @staticmethod
     def _get_mean_std_tensor(shape, names, mean_std: tuple, device="cpu"):
         """Utils method to a get the mean and the std
@@ -193,7 +203,8 @@ def norm_as(self, target_frame) -> Frame:
             )
         else:
             raise Exception(
-                f"Can't convert the tensor normalization to the target_frame normalization: {target_frame.normalization}"
+                "Can't convert the tensor normalization to the"
+                + f"target_frame normalization: {target_frame.normalization}"
             )
 
     def norm255(self) -> Frame: