Handle attributes returned from nuclio detector (#3917)

main
Mikhail Treskin 4 years ago committed by GitHub
parent 6f1d1222bf
commit ad11b587b5

@ -7,6 +7,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
## \[2.0.0] - Unreleased
### Added
- Handle attributes coming from nuclio detectors (<https://github.com/openvinotoolkit/cvat/pull/3917>)
- Add additional environment variables for Nuclio configuration (<https://github.com/openvinotoolkit/cvat/pull/3894>)
- Add KITTI segmentation and detection format (<https://github.com/openvinotoolkit/cvat/pull/3757>)
- Add LFW format (<https://github.com/openvinotoolkit/cvat/pull/3770>)

@ -1,12 +1,12 @@
{
"name": "cvat-ui",
"version": "1.35.1",
"version": "1.35.2",
"lockfileVersion": 2,
"requires": true,
"packages": {
"": {
"name": "cvat-ui",
"version": "1.35.1",
"version": "1.35.2",
"license": "MIT",
"dependencies": {
"@ant-design/icons": "^4.6.3",

@ -1,6 +1,6 @@
{
"name": "cvat-ui",
"version": "1.35.1",
"version": "1.35.2",
"description": "CVAT single-page application",
"main": "src/index.tsx",
"scripts": {

@ -1,4 +1,4 @@
// Copyright (C) 2020-2021 Intel Corporation
// Copyright (C) 2020-2022 Intel Corporation
//
// SPDX-License-Identifier: MIT
@ -1014,6 +1014,13 @@ export class ToolsControlComponent extends React.PureComponent<Props, State> {
</Row>
);
}
const attrsMap: Record<string, Record<string, number>> = {};
jobInstance.labels.forEach((label: any) => {
attrsMap[label.name] = {};
label.attributes.forEach((attr: any) => {
attrsMap[label.name][attr.name] = attr.id;
});
});
return (
<DetectorRunner
@ -1034,7 +1041,11 @@ export class ToolsControlComponent extends React.PureComponent<Props, State> {
frame,
occluded: false,
source: 'auto',
attributes: {},
attributes: (data.attributes as { name: string, value: string }[])
.reduce((mapping, attr) => {
mapping[attrsMap[data.label][attr.name]] = attr.value;
return mapping;
}, {} as Record<number, string>),
zOrder: curZOrder,
}),
);
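For context, the remapping done in this reducer can be sketched in Python (the label, attribute names, and spec IDs below are illustrative, not from a real task): attributes arrive from the detector as name/value pairs and are rewritten into CVAT's spec-id keyed form using the per-label attrsMap built above.

# Minimal Python sketch of the remapping performed by the reducer above (hypothetical data).
attrs_map = {"face": {"age": 11, "gender": 12, "emotion": 13}}   # label -> attribute name -> spec id
detector_attrs = [{"name": "age", "value": "34"}, {"name": "gender", "value": "male"}]
label = "face"
mapping = {attrs_map[label][attr["name"]]: attr["value"] for attr in detector_attrs}
# mapping == {11: "34", 12: "male"}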

@ -1,7 +1,12 @@
# Copyright (C) 2021 Intel Corporation
#
# SPDX-License-Identifier: MIT
import base64
import json
from functools import wraps
from enum import Enum
from copy import deepcopy
import django_rq
import requests
@ -101,6 +106,13 @@ class LambdaFunction:
"`{}` lambda function has non-unique labels".format(self.id),
code=status.HTTP_404_NOT_FOUND)
self.labels = labels
# mapping of labels and corresponding supported attributes
self.func_attributes = {item['name']: item.get('attributes', []) for item in spec}
for label, attributes in self.func_attributes.items():
if len([attr['name'] for attr in attributes]) != len(set([attr['name'] for attr in attributes])):
raise ValidationError(
"`{}` lambda function has non-unique attributes for label {}".format(self.id, label),
code=status.HTTP_404_NOT_FOUND)
# state of the function
self.state = data['status']['state']
# description of the function
@ -141,6 +153,10 @@ class LambdaFunction:
response.update({
'state': self.state
})
if self.kind is LambdaType.DETECTOR:
response.update({
'attributes': self.func_attributes
})
return response
@ -153,11 +169,17 @@ class LambdaFunction:
"threshold": threshold,
})
quality = data.get("quality")
mapping = data.get("mapping")
mapping_by_default = {db_label.name:db_label.name
for db_label in (
db_task.project.label_set if db_task.project_id else db_task.label_set
).all()}
mapping = data.get("mapping", {})
mapping_by_default = {}
task_attributes = {}
for db_label in (db_task.project.label_set if db_task.project_id else db_task.label_set).prefetch_related("attributespec_set").all():
mapping_by_default[db_label.name] = db_label.name
task_attributes[db_label.name] = {}
for attribute in db_label.attributespec_set.all():
task_attributes[db_label.name][attribute.name] = {
'input_type': attribute.input_type,
'values': attribute.values.split('\n')
}
if not mapping:
# use mapping by default to avoid labels in mapping which
# don't exist in the task
@ -165,7 +187,14 @@ class LambdaFunction:
else:
# filter labels in mapping which don't exist in the task
mapping = {k:v for k,v in mapping.items() if v in mapping_by_default}
supported_attrs = {}
for func_label, func_attrs in self.func_attributes.items():
if func_label in mapping:
supported_attrs[func_label] = {}
task_attr_names = [task_attr for task_attr in task_attributes[mapping[func_label]]]
for attr in func_attrs:
if attr['name'] in task_attr_names:
supported_attrs[func_label].update({attr["name"] : attr})
if self.kind == LambdaType.DETECTOR:
payload.update({
"image": self._get_image(db_task, data["frame"], quality)
@ -207,13 +236,53 @@ class LambdaFunction:
code=status.HTTP_400_BAD_REQUEST)
response = self.gateway.invoke(self, payload)
response_filtered = []
def check_attr_value(value, func_attr, db_attr):
if db_attr is None:
return False
func_attr_type = func_attr["input_type"]
db_attr_type = db_attr["input_type"]
# Check if attribute types are equal for function configuration and db spec
if func_attr_type == db_attr_type:
if func_attr_type == "number":
return value.isnumeric()
elif func_attr_type == "checkbox":
return value in ["true", "false"]
elif func_attr_type in ["select", "radio", "text"]:
return True
else:
return False
else:
if func_attr_type == "number":
return db_attr_type in ["select", "radio", "text"] and value.isnumeric()
elif func_attr_type == "text":
return db_attr_type == "text" or \
(db_attr_type in ["select", "radio"] and len(value.split(" ")) == 1)
elif func_attr_type == "select":
return db_attr["input_type"] in ["radio", "text"]
elif func_attr_type == "radio":
return db_attr["input_type"] in ["select", "text"]
elif func_attr_type == "checkbox":
return value in ["true", "false"]
else:
return False
if self.kind == LambdaType.DETECTOR:
if mapping:
for item in response:
item["label"] = mapping.get(item["label"])
response = [item for item in response if item["label"]]
return response
for item in response:
if item['label'] in mapping:
attributes = deepcopy(item.get("attributes", []))
item["attributes"] = []
for attr in attributes:
db_attr = supported_attrs.get(item['label'], {}).get(attr["name"])
func_attr = [func_attr for func_attr in self.func_attributes.get(item['label'], []) if func_attr['name'] == attr["name"]]
# Skip the attribute if it was not declared as supported in the function config
if not func_attr:
continue
if attr["name"] in supported_attrs.get(item['label'], {}) and check_attr_value(attr["value"], func_attr[0], db_attr):
item["attributes"].append(attr)
item['label'] = mapping[item['label']]
response_filtered.append(item)
return response_filtered
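A few illustrative calls to check_attr_value (the attribute dictionaries are made up, not taken from a real function spec or task):

# Matching types: a "number" attribute accepts numeric strings only.
func_attr = {"name": "age", "input_type": "number"}
db_attr = {"name": "age", "input_type": "number"}
check_attr_value("34", func_attr, db_attr)    # True
check_attr_value("old", func_attr, db_attr)   # False: not numeric

# Mismatching types: a "select" value is still accepted by a "text" task attribute.
func_attr = {"name": "gender", "input_type": "select"}
db_attr = {"name": "gender", "input_type": "text"}
check_attr_value("male", func_attr, db_attr)  # True

# The attribute is not defined on the mapped task label at all.
check_attr_value("male", func_attr, None)     # False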
def _get_image(self, db_task, frame, quality):
if quality is None or quality == "original":
@ -381,27 +450,31 @@ class LambdaJob:
break
for anno in annotations:
label_id = labels.get(anno["label"])
if label_id is None:
label = labels.get(anno["label"])
if label is None:
continue # Invalid label provided
if anno.get('attributes'):
attrs = [{'spec_id': label['attributes'][attr['name']], 'value': attr['value']} for attr in anno.get('attributes') if attr['name'] in label['attributes']]
else:
attrs = []
if anno["type"].lower() == "tag":
results.append_tag({
"frame": frame,
"label_id": label_id,
"label_id": label['id'],
"source": "auto",
"attributes": [],
"attributes": attrs,
"group": None,
})
else:
results.append_shape({
"frame": frame,
"label_id": label_id,
"label_id": label['id'],
"type": anno["type"],
"occluded": False,
"points": anno["points"],
"z_order": 0,
"group": None,
"attributes": [],
"attributes": attrs,
"source": "auto"
})
@ -512,7 +585,11 @@ class LambdaJob:
if cleanup:
dm.task.delete_task_data(db_task.id)
db_labels = (db_task.project.label_set if db_task.project_id else db_task.label_set).prefetch_related("attributespec_set").all()
labels = {db_label.name:db_label.id for db_label in db_labels}
labels = {}
for label in db_labels:
labels[label.name] = {'id':label.id, 'attributes': {}}
for attr in label.attributespec_set.values():
labels[label.name]['attributes'][attr['name']] = attr['id']
if function.kind == LambdaType.DETECTOR:
LambdaJob._call_detector(function, db_task, labels, quality,
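A minimal sketch of the new labels structure and the attrs list it produces (IDs and values are hypothetical):

# Hypothetical labels structure built from the task.
labels = {"face": {"id": 7, "attributes": {"age": 21, "gender": 22, "emotion": 23}}}

# A detector annotation carrying name/value attributes...
anno = {"label": "face", "type": "rectangle", "points": [0, 0, 10, 10],
        "attributes": [{"name": "age", "value": "34"}, {"name": "unknown", "value": "x"}]}

# ...is converted into spec_id/value pairs; names the label does not define are dropped.
label = labels[anno["label"]]
attrs = [{"spec_id": label["attributes"][attr["name"]], "value": attr["value"]}
         for attr in anno["attributes"] if attr["name"] in label["attributes"]]
# attrs == [{"spec_id": 21, "value": "34"}]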

@ -1,4 +1,3 @@
# Copyright (C) 2020 Intel Corporation
#
# SPDX-License-Identifier: MIT
@ -13,14 +12,6 @@ class ModelLoader:
network = ie_core.read_network(model, weights)
self._network = network
# Check compatibility
supported_layers = ie_core.query_network(network, "CPU")
not_supported_layers = [l for l in network.layers.keys() if l not in supported_layers]
if len(not_supported_layers) != 0:
raise Exception(
"Following layers are not supported by the plugin for specified device {}:\n {}"
.format(ie_core.device, ", ".join(not_supported_layers)))
# Initialize input blobs
self._input_info_name = None
for blob_name in network.inputs:
@ -41,7 +32,8 @@ class ModelLoader:
input_type = network.inputs[self._input_blob_name]
self._input_layout = input_type if isinstance(input_type, list) else input_type.shape
def infer(self, image, preprocessing=True):
def _prepare_inputs(self, image, preprocessing):
image = np.array(image)
_, _, h, w = self._input_layout
if preprocessing:
@ -57,13 +49,20 @@ class ModelLoader:
inputs = {self._input_blob_name: image}
if self._input_info_name:
inputs[self._input_info_name] = [h, w, 1]
return inputs
def infer(self, image, preprocessing=True):
inputs = self._prepare_inputs(image, preprocessing)
results = self._net.infer(inputs)
if len(results) == 1:
return results[self._output_blob_name].copy()
else:
return results.copy()
def async_infer(self, image, preprocessing=True, request_id=0):
inputs = self._prepare_inputs(image, preprocessing)
return self._net.start_async(request_id=request_id, inputs=inputs)
def input_size(self):
return self._input_layout[2:]
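A short usage sketch of the refactored loader (the model paths and input image are placeholders): infer keeps the original synchronous behaviour, while async_infer hands back the OpenVINO inference request so several networks can run concurrently, polled with the same wait(0) pattern used by the attribute extractor below.

from PIL import Image
model = ModelLoader("model.xml", "model.bin")        # placeholder paths
image = Image.open("face.jpg")                       # placeholder input
outputs = model.infer(image)                         # synchronous, as before
request = model.async_infer(image, request_id=0)     # returns the async inference request
while request.wait(0) != 0:                          # poll until the request completes
    continue
blobs = request.output_blobs                         # outputs of the finished request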

@ -0,0 +1,76 @@
metadata:
name: openvino-omz-face-detection-0205
namespace: cvat
annotations:
name: Attributed face detection
type: detector
framework: openvino
spec: |
[
{ "id": 0, "name": "face", "attributes": [
{
"name": "age",
"input_type": "number",
"values": ["0", "150", "1"]
},
{
"name": "gender",
"input_type": "select",
"values": ["female", "male"]
},
{
"name": "emotion",
"input_type": "select",
"values": ["neutral", "happy", "sad", "surprise", "anger"]
}]
}
]
spec:
description: Face detection network that also estimates age, gender and emotion attributes
runtime: 'python:3.6'
handler: main:handler
eventTimeout: 30000s
env:
- name: NUCLIO_PYTHON_EXE_PATH
value: /opt/nuclio/common/openvino/python3
build:
image: cvat/openvino.omz.intel.face-detection-0205
baseImage: openvino/ubuntu18_dev:2021.1
directives:
preCopy:
- kind: USER
value: root
- kind: WORKDIR
value: /opt/nuclio
- kind: RUN
value: ln -s /usr/bin/pip3 /usr/bin/pip
- kind: RUN
value: /opt/intel/openvino/deployment_tools/open_model_zoo/tools/downloader/downloader.py --name face-detection-0205 -o /opt/nuclio/open_model_zoo
- kind: RUN
value: /opt/intel/openvino/deployment_tools/open_model_zoo/tools/downloader/downloader.py --name emotions-recognition-retail-0003 -o /opt/nuclio/open_model_zoo
- kind: RUN
value: /opt/intel/openvino/deployment_tools/open_model_zoo/tools/downloader/downloader.py --name age-gender-recognition-retail-0013 -o /opt/nuclio/open_model_zoo
postCopy:
- kind: RUN
value: apt update && DEBIAN_FRONTEND=noninteractive apt install --no-install-recommends -y python3-skimage
- kind: RUN
value: pip3 install "numpy<1.16.0" # workaround for skimage
triggers:
myHttpTrigger:
maxWorkers: 2
kind: 'http'
workerAvailabilityTimeoutMilliseconds: 10000
attributes:
maxRequestBodySize: 33554432 # 32MB
platform:
attributes:
restartPolicy:
name: always
maximumRetryCount: 3
mountMode: volume
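Given this spec, the function advertises per-label attributes; after parsing the metadata.annotations.spec above, LambdaFunction.func_attributes in the lambda manager takes roughly this shape:

# Approximate func_attributes parsed from the spec annotation above.
func_attributes = {
    "face": [
        {"name": "age", "input_type": "number", "values": ["0", "150", "1"]},
        {"name": "gender", "input_type": "select", "values": ["female", "male"]},
        {"name": "emotion", "input_type": "select",
         "values": ["neutral", "happy", "sad", "surprise", "anger"]},
    ],
}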

@ -0,0 +1,33 @@
# Copyright (C) 2020-2022 Intel Corporation
#
# SPDX-License-Identifier: MIT
import json
import base64
from PIL import Image
import io
from model_handler import FaceDetectorHandler, AttributesExtractorHandler
def init_context(context):
context.logger.info("Init context... 0%")
# Read the DL model
context.user_data.detector_model = FaceDetectorHandler()
context.user_data.attributes_model = AttributesExtractorHandler()
context.logger.info("Init context...100%")
def handler(context, event):
context.logger.info("Run face-detection-0206 model")
data = event.body
buf = io.BytesIO(base64.b64decode(data["image"]))
threshold = float(data.get("threshold", 0.5))
image = Image.open(buf)
results, faces = context.user_data.detector_model.infer(image, threshold)
for idx, face in enumerate(faces):
attributes = context.user_data.attributes_model.infer(face)
results[idx].update(attributes)
return context.Response(body=json.dumps(results), headers={},
content_type='application/json', status_code=200)
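For one detected face, the JSON body returned by this handler looks roughly like the following (coordinates and confidence are illustrative); the lambda manager then filters these attributes against the task spec and remaps them before they reach the UI:

[
    {
        "confidence": "0.91",
        "label": "face",
        "points": [12, 34, 156, 178],
        "type": "rectangle",
        "attributes": [
            {"name": "age", "value": "34"},
            {"name": "gender", "value": "male"},
            {"name": "emotion", "value": "happy"}
        ]
    }
]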

@ -0,0 +1,71 @@
# Copyright (C) 2020-2022 Intel Corporation
#
# SPDX-License-Identifier: MIT
import os
import numpy as np
from model_loader import ModelLoader
class FaceDetectorHandler:
def __init__(self):
base_dir = os.path.abspath(os.environ.get("DETECTOR_MODEL_PATH",
"/opt/nuclio/open_model_zoo/intel/face-detection-0205/FP32"))
model_xml = os.path.join(base_dir, "face-detection-0205.xml")
model_bin = os.path.join(base_dir, "face-detection-0205.bin")
self.model = ModelLoader(model_xml, model_bin)
def infer(self, image, threshold):
infer_res = self.model.infer(image)["boxes"]
infer_res = infer_res[infer_res[:,4] > threshold]
results = []
faces = []
h_scale = image.height / 416
w_scale = image.width / 416
for face in infer_res:
xmin = int(face[0] * w_scale)
ymin = int(face[1] * h_scale)
xmax = int(face[2] * w_scale)
ymax = int(face[3] * h_scale)
confidence = face[4]
faces.append(np.array(image)[ymin:ymax, xmin:xmax])
results.append({
"confidence": str(confidence),
"label": "face",
"points": [xmin, ymin, xmax, ymax],
"type": "rectangle",
"attributes": []
})
return results, faces
class AttributesExtractorHandler:
def __init__(self):
age_gender_base_dir = os.path.abspath(os.environ.get("AGE_GENDER_MODEL_PATH",
"/opt/nuclio/open_model_zoo/intel/age-gender-recognition-retail-0013/FP32"))
age_gender_model_xml = os.path.join(age_gender_base_dir, "age-gender-recognition-retail-0013.xml")
age_gender_model_bin = os.path.join(age_gender_base_dir, "age-gender-recognition-retail-0013.bin")
self.age_gender_model = ModelLoader(age_gender_model_xml, age_gender_model_bin)
emotions_base_dir = os.path.abspath(os.environ.get("EMOTIONS_MODEL_PATH",
"/opt/nuclio/open_model_zoo/intel/emotions-recognition-retail-0003/FP32"))
emotions_model_xml = os.path.join(emotions_base_dir, "emotions-recognition-retail-0003.xml")
emotions_model_bin = os.path.join(emotions_base_dir, "emotions-recognition-retail-0003.bin")
self.emotions_model = ModelLoader(emotions_model_xml, emotions_model_bin)
self.genders_map = ["female", "male"]
self.emotions_map = ["neutral", "happy", "sad", "surprise", "anger"]
def infer(self, image):
age_gender_request = self.age_gender_model.async_infer(image)
emotions_request = self.emotions_model.async_infer(image)
# Wait until both age_gender and emotion recognition async inferences finish
while not (age_gender_request.wait(0) == 0 and emotions_request.wait(0) == 0):
continue
age = int(np.squeeze(age_gender_request.output_blobs["age_conv3"].buffer) * 100)
gender = self.genders_map[np.argmax(np.squeeze(age_gender_request.output_blobs["prob"].buffer))]
emotion = self.emotions_map[np.argmax(np.squeeze(emotions_request.output_blobs['prob_emotion'].buffer))]
return {"attributes": [
{"name": "age", "value": str(age)},
{"name": "gender", "value": gender},
{"name": "emotion", "value": emotion}
]}