Az/yolo format support (#619)

* added yolo loader/dumper * changed format_spec * updated reamde, changelog * Used bold font for default dump format
7 years ago · 1454ec7ecc
parent f17847ff33
commit 1454ec7ecc
13 changed files with 204 additions and 40 deletions
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@ -18,7 +18,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
 - Ability to create a custom extractors for unsupported media types
 - Added in PDF extractor
 - Added in a command line model manager tester
- Pascal VOC format support
+- Ability to dump/load annotations in several formats from UI (CVAT, Pascal VOC, YOLO)

 ### Changed
 - Outside and keyframe buttons in the side panel for all interpolation shapes (they were only for boxes before)
--- a/README.md
+++ b/README.md
@ -27,13 +27,15 @@ CVAT is free, online, interactive video and image annotation tool for computer v
 - [Tutorial for polygons](https://www.youtube.com/watch?v=XTwfXDh4clI)
 - [Semi-automatic segmentation](https://www.youtube.com/watch?v=vnqXZ-Z-VTQ)

-## Supported formats
+## Supported annotation formats

+Format selection is possible after clicking on the Upload annotation / Dump annotation button.
 | Annotation format         | Dumper | Loader |
 | ------------------------- | ------ | ------ |
 | CVAT XML v1.1 for images  | X      | X      |
 | CVAT XML v1.1 for a video | X      | X      |
 | Pascal VOC                | X      | X      |
+| YOLO                      | X      | X      |

 ## Links
 - [Intel AI blog: New Computer Vision Tool Accelerates Annotation of Digital Images and Video](https://www.intel.ai/introducing-cvat)
--- a/cvat/apps/annotation/annotation.py
+++ b/cvat/apps/annotation/annotation.py
@ -119,9 +119,9 @@ class Annotation:
        self._create_callback=create_callback
        self._MAX_ANNO_SIZE=30000

-        db_labels = self._db_task.label_set.all().prefetch_related('attributespec_set')
+        db_labels = self._db_task.label_set.all().prefetch_related('attributespec_set').order_by('pk')

-        self._label_mapping = {db_label.id: db_label for db_label in db_labels}
+        self._label_mapping = OrderedDict((db_label.id, db_label) for db_label in db_labels)

        self._attribute_mapping = {
            'mutable': {},
--- a/cvat/apps/annotation/pascal_voc.py
+++ b/cvat/apps/annotation/pascal_voc.py
@ -45,7 +45,7 @@ def load(file_object, annotations):
    def parse_xml_file(annotation_file):
        import xml.etree.ElementTree as ET
        root = ET.parse(annotation_file).getroot()
-        filename = root.find('filename').text
+        frame_number = match_frame(annotations.frame_info, root.find('filename').text)

        for obj_tag in root.iter('object'):
            bbox_tag = obj_tag.find("bndbox")
@ -57,14 +57,14 @@ def load(file_object, annotations):

            annotations.add_shape(annotations.LabeledShape(
                type='rectangle',
-                frame=match_frame(annotations.frame_info, filename),
+                frame=frame_number,
                label=label,
                points=[xmin, ymin, xmax, ymax],
                occluded=False,
                attributes=[],
            ))

-    archive_file = file_object if isinstance(file_object, str) else getattr(file_object, 'name')
+    archive_file = getattr(file_object, 'name')
    with TemporaryDirectory() as tmp_dir:
        Archive(archive_file).extractall(tmp_dir)

--- a/cvat/apps/annotation/settings.py
+++ b/cvat/apps/annotation/settings.py
@ -8,4 +8,5 @@ path_prefix = os.path.join('cvat', 'apps', 'annotation')
 BUILTIN_FORMATS = (
    os.path.join(path_prefix, 'cvat.py'),
    os.path.join(path_prefix,'pascal_voc.py'),
+    os.path.join(path_prefix,'yolo.py'),
 )
--- a/cvat/apps/annotation/yolo.py
+++ b/cvat/apps/annotation/yolo.py
@ -0,0 +1,136 @@
+format_spec = {
+    "name": "YOLO",
+    "dumpers": [
+        {
+            "display_name": "{name} {format} {version}",
+            "format": "ZIP",
+            "version": "1.0",
+            "handler": "dump"
+        },
+    ],
+    "loaders": [
+        {
+            "display_name": "{name} {format} {version}",
+            "format": "ZIP",
+            "version": "1.0",
+            "handler": "load"
+        },
+    ],
+}
+
+def get_filename(path):
+    import os
+    return os.path.splitext(os.path.basename(path))[0]
+
+def load(file_object, annotations):
+    from pyunpack import Archive
+    import os
+    from tempfile import TemporaryDirectory
+    from glob import glob
+
+    def convert_from_yolo(img_size, box):
+        # convertation formulas are based on https://github.com/pjreddie/darknet/blob/master/scripts/voc_label.py
+        # <x> <y> <width> <height> - float values relative to width and height of image
+        # <x> <y> - are center of rectangle
+        def clamp(value, _min, _max):
+            return max(min(_max, value), _min)
+        xtl = clamp(img_size[0] * (box[0] - box[2] / 2), 0, img_size[0])
+        ytl = clamp(img_size[1] * (box[1] - box[3] / 2), 0, img_size[1])
+        xbr = clamp(img_size[0] * (box[0] + box[2] / 2), 0, img_size[0])
+        ybr = clamp(img_size[1] * (box[1] + box[3] / 2), 0, img_size[1])
+
+        return [xtl, ytl, xbr, ybr]
+
+    def parse_yolo_obj(img_size, obj):
+        label_id, x, y, w, h = obj.split(" ")
+        return int(label_id), convert_from_yolo(img_size, (float(x), float(y), float(w), float(h)))
+
+    def match_frame(frame_info, filename):
+        import re
+        # try to match by filename
+        yolo_filename = get_filename(filename)
+        for frame_number, info in frame_info.items():
+            cvat_filename = get_filename(info["path"])
+            if cvat_filename == yolo_filename:
+                return frame_number
+
+        # try to extract frame number from filename
+        numbers = re.findall(r"\d+", filename)
+        if numbers and len(numbers) == 1:
+            return int(numbers[0])
+
+        raise Exception("Cannot match filename or determinate framenumber for {} filename".format(filename))
+
+    def parse_yolo_file(annotation_file, labels_mapping):
+        frame_number = match_frame(annotations.frame_info, annotation_file)
+        with open(annotation_file, "r") as fp:
+            line = fp.readline()
+            while line:
+                frame_info = annotations.frame_info[frame_number]
+                label_id, points = parse_yolo_obj((frame_info["width"], frame_info["height"]), line)
+                annotations.add_shape(annotations.LabeledShape(
+                    type="rectangle",
+                    frame=frame_number,
+                    label=labels_mapping[label_id],
+                    points=points,
+                    occluded=False,
+                    attributes=[],
+                ))
+                line = fp.readline()
+
+    def load_labels(labels_file):
+        with open(labels_file, "r") as f:
+            return {idx: label.strip() for idx, label in enumerate(f.readlines()) if label.strip()}
+
+    archive_file = file_object if isinstance(file_object, str) else getattr(file_object, "name")
+    with TemporaryDirectory() as tmp_dir:
+        Archive(archive_file).extractall(tmp_dir)
+
+        labels_file = glob(os.path.join(tmp_dir, "*.names"))
+        if not labels_file:
+            raise Exception("Could not find '*.names' file with labels in uploaded archive")
+        elif len(labels_file) == 1:
+            labels_mapping = load_labels(labels_file[0])
+        else:
+            raise Exception("Too many '*.names' files in uploaded archive: {}".format(labels_file))
+
+        for dirpath, _, filenames in os.walk(tmp_dir):
+            for file in filenames:
+                if ".txt" == os.path.splitext(file)[1]:
+                    parse_yolo_file(os.path.join(dirpath, file), labels_mapping)
+
+def dump(file_object, annotations):
+    from zipfile import ZipFile
+
+    # convertation formulas are based on https://github.com/pjreddie/darknet/blob/master/scripts/voc_label.py
+    # <x> <y> <width> <height> - float values relative to width and height of image
+    # <x> <y> - are center of rectangle
+    def convert_to_yolo(img_size, box):
+        x = (box[0] + box[2]) / 2 / img_size[0]
+        y = (box[1] + box[3]) / 2 / img_size[1]
+        w = (box[2] - box[0]) / img_size[0]
+        h = (box[3] - box[1]) / img_size[1]
+
+        return x, y, w, h
+
+    labels_ids = {label[1]["name"]: idx for idx, label in enumerate(annotations.meta["task"]["labels"])}
+
+    with ZipFile(file_object, "w") as output_zip:
+        for frame_annotation in annotations.group_by_frame():
+            image_name = frame_annotation.name
+            annotation_name = "{}.txt".format(get_filename(image_name))
+            width = frame_annotation.width
+            height = frame_annotation.height
+
+            yolo_annotation = ""
+            for shape in frame_annotation.labeled_shapes:
+                if shape.type != "rectangle":
+                    continue
+
+                label = shape.label
+                yolo_bb = convert_to_yolo((width, height), shape.points)
+                yolo_bb = " ".join("{:.6f}".format(p) for p in yolo_bb)
+                yolo_annotation += "{} {}\n".format(labels_ids[label], yolo_bb)
+
+            output_zip.writestr(annotation_name, yolo_annotation)
+        output_zip.writestr("obj.names", "\n".join(l[0] for l in sorted(labels_ids.items(), key=lambda x:x[1])))
--- a/cvat/apps/auto_annotation/model_manager.py
+++ b/cvat/apps/auto_annotation/model_manager.py
@ -10,8 +10,6 @@ import rq
 import shutil
 import tempfile
 import itertools
-import sys
-import traceback

 from django.db import transaction
 from django.utils import timezone
@ -26,7 +24,8 @@ from cvat.apps.engine.annotation import put_task_data, patch_task_data
 from .models import AnnotationModel, FrameworkChoice
 from .model_loader import ModelLoader, load_labelmap
 from .image_loader import ImageLoader
-from cvat.apps.engine.utils.import_modules import import_modules
+from cvat.apps.engine.utils import import_modules, execute_python_code
+


 def _remove_old_file(model_file_field):
@ -269,9 +268,6 @@ class Results():
            "attributes": attributes or {},
        }

-class InterpreterError(Exception):
-    pass
-
 def _process_detections(detections, path_to_conv_script, restricted=True):
    results = Results()
    local_vars = {
@ -296,21 +292,10 @@ def _process_detections(detections, path_to_conv_script, restricted=True):
        imports = import_modules(source_code)
        global_vars.update(imports)

-    try:
-        exec(source_code, global_vars, local_vars)
-    except SyntaxError as err:
-        error_class = err.__class__.__name__
-        detail = err.args[0]
-        line_number = err.lineno
-    except Exception as err:
-        error_class = err.__class__.__name__
-        detail = err.args[0]
-        cl, exc, tb = sys.exc_info()
-        line_number = traceback.extract_tb(tb)[-1][1]
-    else:
-        return results

-    raise InterpreterError("%s at line %d: %s" % (error_class, line_number, detail))
+    execute_python_code(source_code, global_vars, local_vars)
+
+    return results

 def run_inference_engine_annotation(data, model_file, weights_file,
       labels_mapping, attribute_spec, convertation_file, job=None, update_progress=None, restricted=True):
--- a/cvat/apps/dashboard/static/dashboard/js/dashboard.js
+++ b/cvat/apps/dashboard/static/dashboard/js/dashboard.js
@ -11,6 +11,7 @@
    LabelsInfo:false
    showMessage:false
    showOverlay:false
+    isDefaultFormat:false
 */

 class TaskView {
@ -138,10 +139,15 @@ class TaskView {

        for (const format of this._annotationFormats) {
            for (const dumper of format.dumpers) {
-                dropdownDownloadMenu.append($(`<li>${dumper.display_name}</li>`).on('click', () => {
+                const listItem = $(`<li>${dumper.display_name}</li>`).on('click', () => {
                    dropdownDownloadMenu.addClass('hidden');
                    this._dump(downloadButton[0], dumper.display_name);
-                }));
+                });
+
+                if (isDefaultFormat(dumper.display_name, this._task.mode)) {
+                    listItem.addClass('bold');
+                }
+                dropdownDownloadMenu.append(listItem);
            }

            for (const loader of format.loaders) {
--- a/cvat/apps/engine/annotation.py
+++ b/cvat/apps/engine/annotation.py
@ -13,12 +13,12 @@ from django.db import transaction
 from cvat.apps.profiler import silk_profile
 from cvat.apps.engine.plugins import plugin_decorator
 from cvat.apps.annotation.annotation import AnnotationIR, Annotation
+from cvat.apps.engine.utils import execute_python_code, import_modules

 from . import models
 from .data_manager import DataManager
 from .log import slogger
 from . import serializers
-from .utils.import_modules import import_modules

 class PatchAction(str, Enum):
    CREATE = "create"
@ -593,12 +593,13 @@ class JobAnnotation:
            global_vars = globals()
            imports = import_modules(source_code)
            global_vars.update(imports)
-            exec(source_code, global_vars)
+
+            execute_python_code(source_code, global_vars)

            global_vars["file_object"] = file_object
            global_vars["annotations"] = annotation_importer

-            exec("{}(file_object, annotations)".format(loader.handler), global_vars)
+            execute_python_code("{}(file_object, annotations)".format(loader.handler), global_vars)
        self.create(annotation_importer.data.slice(self.start_frame, self.stop_frame).serialize())

 class TaskAnnotation:
@ -679,11 +680,11 @@ class TaskAnnotation:
            global_vars = globals()
            imports = import_modules(source_code)
            global_vars.update(imports)
-            exec(source_code, global_vars)
+            execute_python_code(source_code, global_vars)
            global_vars["file_object"] = dump_file
            global_vars["annotations"] = anno_exporter

-            exec("{}(file_object, annotations)".format(dumper.handler), global_vars)
+            execute_python_code("{}(file_object, annotations)".format(dumper.handler), global_vars)

    def upload(self, annotation_file, loader):
        annotation_importer = Annotation(
@ -698,12 +699,12 @@ class TaskAnnotation:
            global_vars = globals()
            imports = import_modules(source_code)
            global_vars.update(imports)
-            exec(source_code, global_vars)
+            execute_python_code(source_code, global_vars)

            global_vars["file_object"] = file_object
            global_vars["annotations"] = annotation_importer

-            exec("{}(file_object, annotations)".format(loader.handler), global_vars)
+            execute_python_code("{}(file_object, annotations)".format(loader.handler), global_vars)
        self.create(annotation_importer.data.serialize())

    @property
--- a/cvat/apps/engine/static/engine/js/annotationUI.js
+++ b/cvat/apps/engine/static/engine/js/annotationUI.js
@ -46,6 +46,7 @@
    buildAnnotationSaver:false
    LabelsInfo:false
    uploadJobAnnotationRequest:false
+    isDefaultFormat:false
 */

 async function initLogger(jobID) {
@ -389,7 +390,7 @@ function setupMenu(job, task, shapeCollectionModel,

    for (const format of annotationFormats) {
        for (const dumpSpec of format.dumpers) {
-            $(`<li>${dumpSpec.display_name}</li>`).on('click', async () => {
+            const listItem = $(`<li>${dumpSpec.display_name}</li>`).on('click', async () => {
                $('#downloadAnnotationButton')[0].disabled = true;
                $('#downloadDropdownMenu').addClass('hidden');
                try {
@ -399,7 +400,11 @@ function setupMenu(job, task, shapeCollectionModel,
                } finally {
                    $('#downloadAnnotationButton')[0].disabled = false;
                }
-            }).appendTo('#downloadDropdownMenu');
+            });
+            if (isDefaultFormat(dumpSpec.display_name, task.mode)) {
+                listItem.addClass('bold');
+            }
+            $('#downloadDropdownMenu').append(listItem);
        }

        for (const loader of format.loaders) {
--- a/cvat/apps/engine/static/engine/js/base.js
+++ b/cvat/apps/engine/static/engine/js/base.js
@ -11,6 +11,7 @@
    showOverlay
    uploadJobAnnotationRequest
    uploadTaskAnnotationRequest
+    isDefaultFormat
 */

 /* global
@ -221,3 +222,8 @@ $(document).ready(() => {
        height: `${window.screen.height * 0.95}px`,
    });
 });
+
+function isDefaultFormat(dumperName, taskMode) {
+    return (dumperName === 'CVAT XML 1.1 for videos' && taskMode === 'interpolation')
+    || (dumperName === 'CVAT XML 1.1 for images' && taskMode === 'annotation');
+}
--- a/cvat/apps/engine/utils/import_modules.py
+++ b/cvat/apps/engine/utils/import_modules.py
@ -1,6 +1,8 @@
 import ast
 from collections import namedtuple
 import importlib
+import sys
+import traceback

 Import = namedtuple("Import", ["module", "name", "alias"])

@ -34,3 +36,21 @@ def import_modules(source_code: str):
            results[import_.name] = loaded_module

    return results
+
+class InterpreterError(Exception):
+    pass
+
+def execute_python_code(source_code, global_vars=None, local_vars=None):
+    try:
+        exec(source_code, global_vars, local_vars)
+    except SyntaxError as err:
+        error_class = err.__class__.__name__
+        details = err.args[0]
+        line_number = err.lineno
+        raise InterpreterError("{} at line {}: {}".format(error_class, line_number, details))
+    except Exception as err:
+        error_class = err.__class__.__name__
+        details = err.args[0]
+        _, _, tb = sys.exc_info()
+        line_number = traceback.extract_tb(tb)[-1][1]
+        raise InterpreterError("{} at line {}: {}".format(error_class, line_number, details))
--- a/cvat/apps/engine/views.py
+++ b/cvat/apps/engine/views.py
@ -306,8 +306,9 @@ class TaskViewSet(auth.TaskGetQuerySetMixin, viewsets.ModelViewSet):
                    finally:
                        rq_job.delete()
            elif rq_job.is_failed:
+                exc_info = str(rq_job.exc_info)
                rq_job.delete()
-                return Response(status=status.HTTP_500_INTERNAL_SERVER_ERROR)
+                return Response(data=exc_info, status=status.HTTP_500_INTERNAL_SERVER_ERROR)
            else:
                return Response(status=status.HTTP_202_ACCEPTED)

@ -534,7 +535,8 @@ def load_data_proxy(request, rq_id, rq_func, pk):
        elif rq_job.is_failed:
            os.close(rq_job.meta['tmp_file_descriptor'])
            os.remove(rq_job.meta['tmp_file'])
+            exc_info = str(rq_job.exc_info)
            rq_job.delete()
-            return Response(status=status.HTTP_500_INTERNAL_SERVER_ERROR)
+            return Response(data=exc_info, status=status.HTTP_500_INTERNAL_SERVER_ERROR)

    return Response(status=status.HTTP_202_ACCEPTED)