Add tags to cvat xml (#1200)

* Extend cvat format test * Add tags to cvat for images * Add tags to cvat format in dm * Add import of tags from datumaro
6 years ago · a058765d29
parent 0dae5def6b
commit a058765d29
6 changed files with 165 additions and 12 deletions
--- a/cvat/apps/annotation/cvat.py
+++ b/cvat/apps/annotation/cvat.py
@ -124,6 +124,11 @@ def create_xml_dumper(file_object):
            self.xmlgen.startElement("cuboid", cuboid)
            self._level += 1

+        def open_tag(self, tag):
+            self._indent()
+            self.xmlgen.startElement("tag", tag)
+            self._level += 1
+
        def add_attribute(self, attribute):
            self._indent()
            self.xmlgen.startElement("attribute", {"name": attribute["name"]})
@ -155,6 +160,11 @@ def create_xml_dumper(file_object):
            self._indent()
            self.xmlgen.endElement("cuboid")

+        def close_tag(self):
+            self._level -= 1
+            self._indent()
+            self.xmlgen.endElement("tag")
+
        def close_image(self):
            self._level -= 1
            self._indent()
@ -268,6 +278,22 @@ def dump_as_cvat_annotation(file_object, annotations):
            else:
                raise NotImplementedError("unknown shape type")

+        for tag in frame_annotation.tags:
+            tag_data = OrderedDict([
+                ("label", tag.label),
+            ])
+            if tag.group:
+                tag_data["group_id"] = str(tag.group)
+            dumper.open_tag(tag_data)
+
+            for attr in tag.attributes:
+                dumper.add_attribute(OrderedDict([
+                    ("name", attr.name),
+                    ("value", attr.value)
+                ]))
+
+            dumper.close_tag()
+
        dumper.close_image()
    dumper.close_root()

@ -408,7 +434,9 @@ def load(file_object, annotations):

    track = None
    shape = None
+    tag = None
    image_is_opened = False
+    attributes = None
    for ev, el in context:
        if ev == 'start':
            if el.tag == 'track':
@ -421,13 +449,22 @@ def load(file_object, annotations):
                image_is_opened = True
                frame_id = int(el.attrib['id'])
            elif el.tag in supported_shapes and (track is not None or image_is_opened):
+                attributes = []
                shape = {
-                    'attributes': [],
+                    'attributes': attributes,
                    'points': [],
                }
+            elif el.tag == 'tag' and image_is_opened:
+                attributes = []
+                tag = {
+                    'frame': frame_id,
+                    'label': el.attrib['label'],
+                    'group': int(el.attrib.get('group_id', 0)),
+                    'attributes': attributes,
+                }
        elif ev == 'end':
-            if el.tag == 'attribute' and shape is not None:
-                shape['attributes'].append(annotations.Attribute(
+            if el.tag == 'attribute' and attributes is not None:
+                attributes.append(annotations.Attribute(
                    name=el.attrib['name'],
                    value=el.text,
                ))
@ -484,4 +521,7 @@ def load(file_object, annotations):
                track = None
            elif el.tag == 'image':
                image_is_opened = False
+            elif el.tag == 'tag':
+                annotations.add_tag(annotations.Tag(**tag))
+                tag = None
            el.clear()
--- a/cvat/apps/dataset_manager/bindings.py
+++ b/cvat/apps/dataset_manager/bindings.py
@ -236,5 +236,14 @@ def import_dm_annotations(dm_dataset, cvat_task_anno):
                    points=ann.points,
                    occluded=False,
                    group=group_map.get(ann.group, 0),
-                    attributes=[],
+                    attributes=[cvat_task_anno.Attribute(name=n, value=str(v))
+                        for n, v in ann.attributes.items()],
+                ))
+            elif ann.type == datumaro.AnnotationType.label:
+                cvat_task_anno.add_shape(cvat_task_anno.Tag(
+                    frame=frame_number,
+                    label=label_cat.items[ann.label].name,
+                    group=group_map.get(ann.group, 0),
+                    attributes=[cvat_task_anno.Attribute(name=n, value=str(v))
+                        for n, v in ann.attributes.items()],
                ))
--- a/cvat/apps/engine/tests/test_rest_api.py
+++ b/cvat/apps/engine/tests/test_rest_api.py
@ -2638,6 +2638,47 @@ class TaskAnnotationAPITestCase(JobAnnotationAPITestCase):
                "occluded": False
            }]

+            polygon_shapes_with_attrs = [{
+                "frame": 2,
+                "label_id": task["labels"][0]["id"],
+                "group": 1,
+                "attributes": [
+                    {
+                        "spec_id": task["labels"][0]["attributes"][0]["id"],
+                        "value": task["labels"][0]["attributes"][0]["values"][1]
+                    },
+                    {
+                        "spec_id": task["labels"][0]["attributes"][1]["id"],
+                        "value": task["labels"][0]["attributes"][1]["default_value"]
+                    }
+                ],
+                "points": [20.0, 0.1, 10, 3.22, 4, 7, 10, 30, 1, 2, 4.44, 5.55],
+                "type": "polygon",
+                "occluded": True
+            }]
+
+            tags_wo_attrs = [{
+                "frame": 2,
+                "label_id": task["labels"][1]["id"],
+                "group": 3,
+                "attributes": []
+            }]
+            tags_with_attrs = [{
+                "frame": 1,
+                "label_id": task["labels"][0]["id"],
+                "group": 0,
+                "attributes": [
+                    {
+                        "spec_id": task["labels"][0]["attributes"][0]["id"],
+                        "value": task["labels"][0]["attributes"][0]["values"][1]
+                    },
+                    {
+                        "spec_id": task["labels"][0]["attributes"][1]["id"],
+                        "value": task["labels"][0]["attributes"][1]["default_value"]
+                    }
+                ],
+            }]
+
            annotations = {
                    "version": 0,
                    "tags": [],
@ -2648,7 +2689,9 @@ class TaskAnnotationAPITestCase(JobAnnotationAPITestCase):
                annotations["tracks"] = rectangle_tracks_with_attrs + rectangle_tracks_wo_attrs

            elif annotation_format == "CVAT XML 1.1 for images":
-                annotations["shapes"] = rectangle_shapes_with_attrs + rectangle_shapes_wo_attrs
+                annotations["shapes"] = rectangle_shapes_with_attrs + rectangle_shapes_wo_attrs \
+                    + polygon_shapes_wo_attrs + polygon_shapes_with_attrs
+                annotations["tags"] = tags_with_attrs + tags_wo_attrs

            elif annotation_format == "PASCAL VOC ZIP 1.1" or \
                 annotation_format == "YOLO ZIP 1.1" or \
--- a/datumaro/datumaro/plugins/cvat_format/converter.py
+++ b/datumaro/datumaro/plugins/cvat_format/converter.py
@ -113,6 +113,11 @@ class XmlAnnotationWriter:
        self.xmlgen.startElement('points', points)
        self._level += 1

+    def open_tag(self, tag):
+        self._indent()
+        self.xmlgen.startElement("tag", tag)
+        self._level += 1
+
    def add_attribute(self, attribute):
        self._indent()
        self.xmlgen.startElement('attribute', {'name': attribute['name']})
@ -136,6 +141,9 @@ class XmlAnnotationWriter:
    def close_points(self):
        self._close_element('points')

+    def close_tag(self):
+        self._close_element('tag')
+
    def close_image(self):
        self._close_element('image')

@ -201,6 +209,8 @@ class _SubsetWriter:
            if ann.type in {AnnotationType.points, AnnotationType.polyline,
                    AnnotationType.polygon, AnnotationType.bbox}:
                self._write_shape(ann)
+            elif ann.type == AnnotationType.label:
+                self._write_tag(ann)
            else:
                continue

@ -303,6 +313,28 @@ class _SubsetWriter:
        else:
            raise NotImplementedError("unknown shape type")

+    def _write_tag(self, label):
+        if label.label is None:
+            return
+
+        tag_data = OrderedDict([
+            ('label', self._get_label(label.label).name),
+        ])
+        if label.group:
+            tag_data['group_id'] = str(label.group)
+        self._writer.open_tag(tag_data)
+
+        for attr_name, attr_value in label.attributes.items():
+            if isinstance(attr_value, bool):
+                attr_value = 'true' if attr_value else 'false'
+            if attr_name in self._get_label(label.label).attributes:
+                self._writer.add_attribute(OrderedDict([
+                    ("name", str(attr_name)),
+                    ("value", str(attr_value)),
+                ]))
+
+        self._writer.close_tag()
+
 class _Converter:
    def __init__(self, extractor, save_dir, save_images=False):
        self._extractor = extractor
--- a/datumaro/datumaro/plugins/cvat_format/extractor.py
+++ b/datumaro/datumaro/plugins/cvat_format/extractor.py
@ -9,7 +9,7 @@ import xml.etree as ET

 from datumaro.components.extractor import (SourceExtractor,
    DEFAULT_SUBSET_NAME, DatasetItem,
-    AnnotationType, Points, Polygon, PolyLine, Bbox,
+    AnnotationType, Points, Polygon, PolyLine, Bbox, Label,
    LabelCategories
 )
 from datumaro.util.image import Image
@ -73,6 +73,8 @@ class CvatExtractor(SourceExtractor):

        track = None
        shape = None
+        tag = None
+        attributes = None
        image = None
        for ev, el in context:
            if ev == 'start':
@ -92,16 +94,25 @@ class CvatExtractor(SourceExtractor):
                        'height': el.attrib.get('height'),
                    }
                elif el.tag in cls._SUPPORTED_SHAPES and (track or image):
+                    attributes = {}
                    shape = {
                        'type': None,
-                        'attributes': {},
+                        'attributes': attributes,
                    }
                    if track:
                        shape.update(track)
                    if image:
                        shape.update(image)
+                elif el.tag == 'tag' and image:
+                    attributes = {}
+                    tag = {
+                        'frame': image['frame'],
+                        'attributes': attributes,
+                        'group': int(el.attrib.get('group_id', 0)),
+                        'label': el.attrib['label'],
+                    }
            elif ev == 'end':
-                if el.tag == 'attribute' and shape is not None:
+                if el.tag == 'attribute' and attributes is not None:
                    attr_value = el.text
                    if el.text in ['true', 'false']:
                        attr_value = attr_value == 'true'
@ -110,7 +121,7 @@ class CvatExtractor(SourceExtractor):
                            attr_value = float(attr_value)
                        except Exception:
                            pass
-                    shape['attributes'][el.attrib['name']] = attr_value
+                    attributes[el.attrib['name']] = attr_value
                elif el.tag in cls._SUPPORTED_SHAPES:
                    if track is not None:
                        shape['frame'] = el.attrib['frame']
@ -136,10 +147,16 @@ class CvatExtractor(SourceExtractor):

                    frame_desc = items.get(shape['frame'], {'annotations': []})
                    frame_desc['annotations'].append(
-                        cls._parse_ann(shape, categories))
+                        cls._parse_shape_ann(shape, categories))
                    items[shape['frame']] = frame_desc
                    shape = None

+                elif el.tag == 'tag':
+                    frame_desc = items.get(tag['frame'], {'annotations': []})
+                    frame_desc['annotations'].append(
+                        cls._parse_tag_ann(tag, categories))
+                    items[tag['frame']] = frame_desc
+                    tag = None
                elif el.tag == 'track':
                    track = None
                elif el.tag == 'image':
@ -252,7 +269,7 @@ class CvatExtractor(SourceExtractor):
        return categories, frame_size

    @classmethod
-    def _parse_ann(cls, ann, categories):
+    def _parse_shape_ann(cls, ann, categories):
        ann_id = ann.get('id')
        ann_type = ann['type']

@ -294,6 +311,14 @@ class CvatExtractor(SourceExtractor):
        else:
            raise NotImplementedError("Unknown annotation type '%s'" % ann_type)

+    @classmethod
+    def _parse_tag_ann(cls, ann, categories):
+        label = ann.get('label')
+        label_id = categories[AnnotationType.label].find(label)[0]
+        group = ann.get('group')
+        attributes = ann.get('attributes')
+        return Label(label_id, attributes=attributes, group=group)
+
    def _load_items(self, parsed):
        for frame_id, item_desc in parsed.items():
            filename = item_desc.get('name')
--- a/datumaro/tests/test_cvat_format.py
+++ b/datumaro/tests/test_cvat_format.py
@ -6,7 +6,7 @@ from xml.etree import ElementTree as ET
 from unittest import TestCase

 from datumaro.components.extractor import (Extractor, DatasetItem,
-    AnnotationType, Points, Polygon, PolyLine, Bbox,
+    AnnotationType, Points, Polygon, PolyLine, Bbox, Label,
    LabelCategories,
 )
 from datumaro.plugins.cvat_format.importer import CvatImporter
@ -173,6 +173,8 @@ class CvatConverterTest(TestCase):
                            Points([1, 1, 3, 2, 2, 3],
                                label=2,
                                attributes={ 'a1': 'x', 'a2': 42 }),
+                            Label(1),
+                            Label(2, attributes={ 'a1': 'y', 'a2': 44 }),
                        ]
                    ),
                    DatasetItem(id=1, subset='s1',
@ -215,6 +217,8 @@ class CvatConverterTest(TestCase):
                                label=2,
                                attributes={ 'z_order': 0, 'occluded': False,
                                    'a1': 'x', 'a2': 42 }),
+                            Label(1),
+                            Label(2, attributes={ 'a1': 'y', 'a2': 44 }),
                        ]
                    ),
                    DatasetItem(id=1, subset='s1',