From e225c380920dc4b31f876934bc4b041f07bf60c3 Mon Sep 17 00:00:00 2001 From: Boris Sekachev <40690378+bsekachev@users.noreply.github.com> Date: Fri, 8 Feb 2019 15:59:10 +0300 Subject: [PATCH] Re-Identification application (#299) --- .remarkrc.js | 16 ++ CHANGELOG.md | 1 + Dockerfile | 15 +- .../engine/static/engine/js/annotationUI.js | 9 +- cvat/apps/reid/README.md | 22 ++ cvat/apps/reid/__init__.py | 9 + cvat/apps/reid/apps.py | 8 + cvat/apps/reid/reid.py | 226 ++++++++++++++++++ cvat/apps/reid/static/reid/js/enginePlugin.js | 170 +++++++++++++ cvat/apps/reid/urls.py | 12 + cvat/apps/reid/views.py | 96 ++++++++ cvat/settings/base.py | 3 + cvat/urls.py | 3 + 13 files changed, 584 insertions(+), 6 deletions(-) create mode 100644 .remarkrc.js create mode 100644 cvat/apps/reid/README.md create mode 100644 cvat/apps/reid/__init__.py create mode 100644 cvat/apps/reid/apps.py create mode 100644 cvat/apps/reid/reid.py create mode 100644 cvat/apps/reid/static/reid/js/enginePlugin.js create mode 100644 cvat/apps/reid/urls.py create mode 100644 cvat/apps/reid/views.py diff --git a/.remarkrc.js b/.remarkrc.js new file mode 100644 index 000000000000..23862ca44441 --- /dev/null +++ b/.remarkrc.js @@ -0,0 +1,16 @@ +exports.settings = {bullet: '*', paddedTable: false} + +exports.plugins = [ + require('remark-preset-lint-recommended'), + require('remark-preset-lint-consistent'), + require('remark-validate-links'), + [require("remark-lint-no-dead-urls"), { skipOffline: true }], + [require("remark-lint-maximum-line-length"), 120], + [require("remark-lint-maximum-heading-length"), 120], + [require("remark-lint-list-item-indent"), "tab-size"], + [require("remark-lint-list-item-spacing"), false], + [require("remark-lint-strong-marker"), "*"], + [require("remark-lint-emphasis-marker"), "_"], + [require("remark-lint-unordered-list-marker-style"), "-"], + [require("remark-lint-ordered-list-marker-style"), "."], +] diff --git a/CHANGELOG.md b/CHANGELOG.md index 6097e3648355..d2bf4c9ba669 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -8,6 +8,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0 ### Added - OpenVINO auto annotation: it is possible to upload a custom model and annotate images automatically. - Ability to rotate images/video in the client part (Ctrl+R, Shift+Ctrl+R shortcuts) (#305) +- The ReID application for automatic bounding box merging has been added (#299) ### Changed - Propagation setup has been moved from settings to bottom player panel diff --git a/Dockerfile b/Dockerfile index 97f84c3f0f43..48dbe177843d 100644 --- a/Dockerfile +++ b/Dockerfile @@ -103,14 +103,11 @@ RUN if [ "$WITH_TESTS" = "yes" ]; then \ COPY cvat/requirements/ /tmp/requirements/ COPY supervisord.conf mod_wsgi.conf wait-for-it.sh manage.py ${HOME}/ RUN pip3 install --no-cache-dir -r /tmp/requirements/${DJANGO_CONFIGURATION}.txt -COPY cvat/ ${HOME}/cvat - -COPY ssh ${HOME}/.ssh # Install git application dependencies RUN apt-get update && \ apt-get install -y ssh netcat-openbsd git curl zip && \ - curl -s https://packagecloud.io/install/repositories/github/git-lfs/script.deb.sh | bash && \ + wget -qO /dev/stdout https://packagecloud.io/install/repositories/github/git-lfs/script.deb.sh | bash && \ apt-get install -y git-lfs && \ git lfs install && \ rm -rf /var/lib/apt/lists/* && \ @@ -120,6 +117,16 @@ RUN apt-get update && \ echo export "GIT_SSH_COMMAND=\"ssh -o StrictHostKeyChecking=no -o ConnectTimeout=30 -o ProxyCommand='nc -X 5 -x ${socks_proxy} %h %p'\"" >> ${HOME}/.bashrc; \ fi +# Download model for re-identification app +ENV REID_MODEL_DIR=${HOME}/reid +RUN if [ "$OPENVINO_TOOLKIT" = "yes" ]; then \ + mkdir ${HOME}/reid && \ + wget https://download.01.org/openvinotoolkit/2018_R5/open_model_zoo/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.xml -O reid/reid.xml && \ + wget https://download.01.org/openvinotoolkit/2018_R5/open_model_zoo/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.bin -O reid/reid.bin; \ + fi + +COPY ssh ${HOME}/.ssh +COPY cvat/ ${HOME}/cvat COPY tests ${HOME}/tests RUN patch -p1 < ${HOME}/cvat/apps/engine/static/engine/js/3rdparty.patch RUN chown -R ${USER}:${USER} . diff --git a/cvat/apps/engine/static/engine/js/annotationUI.js b/cvat/apps/engine/static/engine/js/annotationUI.js index c351f4c5e614..58b306c1e2d4 100644 --- a/cvat/apps/engine/static/engine/js/annotationUI.js +++ b/cvat/apps/engine/static/engine/js/annotationUI.js @@ -159,7 +159,12 @@ function buildAnnotationUI(job, shapeData, loadJobEvent) { window.cvat.data = { get: () => shapeCollectionModel.exportAll(), set: (data) => { - shapeCollectionModel.empty(); + for (let type in data) { + for (let shape of data[type]) { + shape.id = idGenerator.next(); + } + } + shapeCollectionModel.import(data, false); shapeCollectionModel.update(); }, @@ -248,7 +253,7 @@ function buildAnnotationUI(job, shapeData, loadJobEvent) { $(window).on('click', function(event) { Logger.updateUserActivityTimer(); - if (event.target.classList.contains('modal')) { + if (event.target.classList.contains('modal') && !event.target.classList.contains('force-modal')) { event.target.classList.add('hidden'); } }); diff --git a/cvat/apps/reid/README.md b/cvat/apps/reid/README.md new file mode 100644 index 000000000000..8cf29c503781 --- /dev/null +++ b/cvat/apps/reid/README.md @@ -0,0 +1,22 @@ +# Re-Identification Application + +## About the application + +The ReID application uses deep learning model to perform an automatic bbox merging between neighbor frames. +You can use "Merge" and "Split" functionality to edit automatically generated annotation. + +## Installation + +This application will be installed automatically with the [OpenVINO](https://github.com/opencv/cvat/blob/develop/components/openvino/README.md) component. + +## Running + +For starting the ReID merge process: + +- Open an annotation job +- Open the menu +- Click the "Run ReID Merge" button +- Click the "Submit" button. Also here you can experiment with values of model threshold or maximum distance. + - Model threshold is maximum cosine distance between objects embeddings. + - Maximum distance defines a maximum radius that an object can diverge between neightbor frames. +- The process will be run. You can cancel it in the menu. diff --git a/cvat/apps/reid/__init__.py b/cvat/apps/reid/__init__.py new file mode 100644 index 000000000000..4a9759cc68f5 --- /dev/null +++ b/cvat/apps/reid/__init__.py @@ -0,0 +1,9 @@ +# Copyright (C) 2018 Intel Corporation +# +# SPDX-License-Identifier: MIT + +from cvat.settings.base import JS_3RDPARTY + +default_app_config = 'cvat.apps.reid.apps.ReidConfig' + +JS_3RDPARTY['engine'] = JS_3RDPARTY.get('engine', []) + ['reid/js/enginePlugin.js'] diff --git a/cvat/apps/reid/apps.py b/cvat/apps/reid/apps.py new file mode 100644 index 000000000000..f6aa66e1a5f9 --- /dev/null +++ b/cvat/apps/reid/apps.py @@ -0,0 +1,8 @@ +# Copyright (C) 2018 Intel Corporation +# +# SPDX-License-Identifier: MIT + +from django.apps import AppConfig + +class ReidConfig(AppConfig): + name = 'cvat.apps.reid' diff --git a/cvat/apps/reid/reid.py b/cvat/apps/reid/reid.py new file mode 100644 index 000000000000..915359b3e11a --- /dev/null +++ b/cvat/apps/reid/reid.py @@ -0,0 +1,226 @@ +# Copyright (C) 2018 Intel Corporation +# +# SPDX-License-Identifier: MIT + +import os +import rq +import cv2 +import math +import numpy +import fnmatch + +from openvino.inference_engine import IENetwork, IEPlugin +from scipy.optimize import linear_sum_assignment +from scipy.spatial.distance import euclidean, cosine + +from cvat.apps.engine.models import Job + + +class ReID: + __threshold = None + __max_distance = None + __frame_urls = None + __frame_boxes = None + __stop_frame = None + __plugin = None + __executable_network = None + __input_blob_name = None + __output_blob_name = None + __input_height = None + __input_width = None + + + def __init__(self, jid, data): + self.__threshold = data["threshold"] + self.__max_distance = data["maxDistance"] + self.__frame_urls = {} + self.__frame_boxes = {} + + db_job = Job.objects.select_related('segment__task').get(pk = jid) + db_segment = db_job.segment + db_task = db_segment.task + + self.__stop_frame = db_segment.stop_frame + + for root, _, filenames in os.walk(db_task.get_data_dirname()): + for filename in fnmatch.filter(filenames, '*.jpg'): + frame = int(os.path.splitext(filename)[0]) + if frame >= db_segment.start_frame and frame <= db_segment.stop_frame: + self.__frame_urls[frame] = os.path.join(root, filename) + + for frame in self.__frame_urls: + self.__frame_boxes[frame] = [box for box in data["boxes"] if box["frame"] == frame] + + IE_PLUGINS_PATH = os.getenv('IE_PLUGINS_PATH', None) + REID_MODEL_DIR = os.getenv('REID_MODEL_DIR', None) + + if not IE_PLUGINS_PATH: + raise Exception("Environment variable 'IE_PLUGINS_PATH' isn't defined") + if not REID_MODEL_DIR: + raise Exception("Environment variable 'REID_MODEL_DIR' isn't defined") + + REID_XML = os.path.join(REID_MODEL_DIR, "reid.xml") + REID_BIN = os.path.join(REID_MODEL_DIR, "reid.bin") + + self.__plugin = IEPlugin(device="CPU", plugin_dirs=[IE_PLUGINS_PATH]) + network = IENetwork.from_ir(model=REID_XML, weights=REID_BIN) + self.__input_blob_name = next(iter(network.inputs)) + self.__output_blob_name = next(iter(network.outputs)) + self.__input_height, self.__input_width = network.inputs[self.__input_blob_name].shape[-2:] + self.__executable_network = self.__plugin.load(network=network) + del network + + + def __del__(self): + if self.__executable_network: + del self.__executable_network + self.__executable_network = None + + if self.__plugin: + del self.__plugin + self.__plugin = None + + + def __boxes_are_compatible(self, cur_box, next_box): + cur_c_x = (cur_box["xtl"] + cur_box["xbr"]) / 2 + cur_c_y = (cur_box["ytl"] + cur_box["ybr"]) / 2 + next_c_x = (next_box["xtl"] + next_box["xbr"]) / 2 + next_c_y = (next_box["ytl"] + next_box["ybr"]) / 2 + compatible_distance = euclidean([cur_c_x, cur_c_y], [next_c_x, next_c_y]) <= self.__max_distance + compatible_label = cur_box["label_id"] == next_box["label_id"] + return compatible_distance and compatible_label and "path_id" not in next_box + + + def __compute_difference(self, image_1, image_2): + image_1 = cv2.resize(image_1, (self.__input_width, self.__input_height)).transpose((2,0,1)) + image_2 = cv2.resize(image_2, (self.__input_width, self.__input_height)).transpose((2,0,1)) + + input_1 = { + self.__input_blob_name: image_1[numpy.newaxis, ...] + } + + input_2 = { + self.__input_blob_name: image_2[numpy.newaxis, ...] + } + + embedding_1 = self.__executable_network.infer(inputs = input_1)[self.__output_blob_name] + embedding_2 = self.__executable_network.infer(inputs = input_2)[self.__output_blob_name] + + embedding_1 = embedding_1.reshape(embedding_1.size) + embedding_2 = embedding_2.reshape(embedding_2.size) + + return cosine(embedding_1, embedding_2) + + + def __compute_difference_matrix(self, cur_boxes, next_boxes, cur_image, next_image): + def _int(number, upper): + return math.floor(numpy.clip(number, 0, upper - 1)) + + default_mat_value = 1000.0 + + matrix = numpy.full([len(cur_boxes), len(next_boxes)], default_mat_value, dtype=float) + for row, cur_box in enumerate(cur_boxes): + cur_width = cur_image.shape[1] + cur_height = cur_image.shape[0] + cur_xtl, cur_xbr, cur_ytl, cur_ybr = ( + _int(cur_box["xtl"], cur_width), _int(cur_box["xbr"], cur_width), + _int(cur_box["ytl"], cur_height), _int(cur_box["ybr"], cur_height) + ) + + for col, next_box in enumerate(next_boxes): + next_box = next_boxes[col] + next_width = next_image.shape[1] + next_height = next_image.shape[0] + next_xtl, next_xbr, next_ytl, next_ybr = ( + _int(next_box["xtl"], next_width), _int(next_box["xbr"], next_width), + _int(next_box["ytl"], next_height), _int(next_box["ybr"], next_height) + ) + + if not self.__boxes_are_compatible(cur_box, next_box): + continue + + crop_1 = cur_image[cur_ytl:cur_ybr, cur_xtl:cur_xbr] + crop_2 = next_image[next_ytl:next_ybr, next_xtl:next_xbr] + matrix[row][col] = self.__compute_difference(crop_1, crop_2) + + return matrix + + + def __apply_matching(self): + frames = sorted(list(self.__frame_boxes.keys())) + job = rq.get_current_job() + box_paths = {} + + for idx, (cur_frame, next_frame) in enumerate(list(zip(frames[:-1], frames[1:]))): + job.refresh() + if "cancel" in job.meta: + return None + + job.meta["progress"] = idx * 100.0 / len(frames) + job.save_meta() + + cur_boxes = self.__frame_boxes[cur_frame] + next_boxes = self.__frame_boxes[next_frame] + + for box in cur_boxes: + if "path_id" not in box: + path_id = len(box_paths) + box_paths[path_id] = [box] + box["path_id"] = path_id + + if not (len(cur_boxes) and len(next_boxes)): + continue + + cur_image = cv2.imread(self.__frame_urls[cur_frame], cv2.IMREAD_COLOR) + next_image = cv2.imread(self.__frame_urls[next_frame], cv2.IMREAD_COLOR) + difference_matrix = self.__compute_difference_matrix(cur_boxes, next_boxes, cur_image, next_image) + cur_idxs, next_idxs = linear_sum_assignment(difference_matrix) + for idx, cur_idx in enumerate(cur_idxs): + if (difference_matrix[cur_idx][next_idxs[idx]]) <= self.__threshold: + cur_box = cur_boxes[cur_idx] + next_box = next_boxes[next_idxs[idx]] + next_box["path_id"] = cur_box["path_id"] + box_paths[cur_box["path_id"]].append(next_box) + + for box in self.__frame_boxes[frames[-1]]: + if "path_id" not in box: + path_id = len(box_paths) + box["path_id"] = path_id + box_paths[path_id] = [box] + + return box_paths + + + def run(self): + box_paths = self.__apply_matching() + output = [] + + # ReID process has been canceled + if box_paths is None: + return + + for path_id in box_paths: + output.append({ + "label_id": box_paths[path_id][0]["label_id"], + "group_id": 0, + "attributes": [], + "frame": box_paths[path_id][0]["frame"], + "shapes": box_paths[path_id] + }) + + for box in output[-1]["shapes"]: + del box["id"] + del box["path_id"] + del box["group_id"] + del box["label_id"] + box["outside"] = False + box["attributes"] = [] + + for path in output: + if path["shapes"][-1]["frame"] != self.__stop_frame: + copy = path["shapes"][-1].copy() + copy["outside"] = True + copy["frame"] += 1 + path["shapes"].append(copy) + + return output diff --git a/cvat/apps/reid/static/reid/js/enginePlugin.js b/cvat/apps/reid/static/reid/js/enginePlugin.js new file mode 100644 index 000000000000..6bf14377cf5a --- /dev/null +++ b/cvat/apps/reid/static/reid/js/enginePlugin.js @@ -0,0 +1,170 @@ +/* + * Copyright (C) 2018 Intel Corporation + * + * SPDX-License-Identifier: MIT + */ + +/* global showMessage userConfirm */ + + +document.addEventListener('DOMContentLoaded', () => { + function run(overlay, cancelButton, thresholdInput, distanceInput) { + const collection = window.cvat.data.get(); + const data = { + threshold: +thresholdInput.prop('value'), + maxDistance: +distanceInput.prop('value'), + boxes: collection.boxes, + }; + + overlay.removeClass('hidden'); + cancelButton.prop('disabled', true); + $.ajax({ + url: `reid/start/job/${window.cvat.job.id}`, + type: 'POST', + data: JSON.stringify(data), + contentType: 'application/json', + success: () => { + function checkCallback() { + $.ajax({ + url: `/reid/check/${window.cvat.job.id}`, + type: 'GET', + success: (jobData) => { + if (jobData.progress) { + cancelButton.text(`Cancel ReID Merge (${jobData.progress.toString().slice(0, 4)}%)`); + } + + if (['queued', 'started'].includes(jobData.status)) { + setTimeout(checkCallback, 1000); + } else { + overlay.addClass('hidden'); + + if (jobData.status === 'finished') { + if (jobData.result) { + collection.boxes = []; + collection.box_paths = collection.box_paths + .concat(JSON.parse(jobData.result)); + window.cvat.data.clear(); + window.cvat.data.set(collection); + showMessage('ReID merge has done.'); + } else { + showMessage('ReID merge been canceled.'); + } + } else if (jobData.status === 'failed') { + const message = `ReID merge has fallen. Error: '${jobData.stderr}'`; + showMessage(message); + } else { + let message = `Check request returned "${jobData.status}" status.`; + if (jobData.stderr) { + message += ` Error: ${jobData.stderr}`; + } + showMessage(message); + } + } + }, + error: (errorData) => { + overlay.addClass('hidden'); + const message = `Can not check ReID merge. Code: ${errorData.status}. Message: ${errorData.responseText || errorData.statusText}`; + showMessage(message); + }, + }); + } + + setTimeout(checkCallback, 1000); + }, + error: (errorData) => { + overlay.addClass('hidden'); + const message = `Can not start ReID merge. Code: ${errorData.status}. Message: ${errorData.responseText || errorData.statusText}`; + showMessage(message); + }, + complete: () => { + cancelButton.prop('disabled', false); + }, + }); + } + + function cancel(overlay, cancelButton) { + cancelButton.prop('disabled', true); + $.ajax({ + url: `/reid/cancel/${window.cvat.job.id}`, + type: 'GET', + success: () => { + overlay.addClass('hidden'); + cancelButton.text('Cancel ReID Merge (0%)'); + }, + error: (errorData) => { + const message = `Can not cancel ReID process. Code: ${errorData.status}. Message: ${errorData.responseText || errorData.statusText}`; + showMessage(message); + }, + complete: () => { + cancelButton.prop('disabled', false); + } + }); + } + + const buttonsUI = $('#engineMenuButtons'); + const reidWindowId = 'reidSubmitWindow'; + const reidThresholdValueId = 'reidThresholdValue'; + const reidDistanceValueId = 'reidDistanceValue'; + const reidCancelMergeId = 'reidCancelMerge'; + const reidSubmitMergeId = 'reidSubmitMerge'; + const reidCancelButtonId = 'reidCancelReID'; + const reidOverlay = 'reidOverlay'; + + $('').on('click', () => { + $('#annotationMenu').addClass('hidden'); + $(`#${reidWindowId}`).removeClass('hidden'); + }).addClass('menuButton semiBold h2').prependTo(buttonsUI); + + $(` +
+ `).appendTo('body'); + + $(` + + + `).appendTo('body'); + + $(`#${reidCancelMergeId}`).on('click', () => { + $(`#${reidWindowId}`).addClass('hidden'); + }); + + $(`#${reidCancelButtonId}`).on('click', () => { + userConfirm('ReID process will be canceld. Are you sure?', () => { + cancel($(`#${reidOverlay}`), $(`#${reidCancelButtonId}`)); + }); + }); + + $(`#${reidSubmitMergeId}`).on('click', () => { + $(`#${reidWindowId}`).addClass('hidden'); + run($(`#${reidOverlay}`), $(`#${reidCancelButtonId}`), + $(`#${reidThresholdValueId}`), $(`#${reidDistanceValueId}`)); + }); +}); diff --git a/cvat/apps/reid/urls.py b/cvat/apps/reid/urls.py new file mode 100644 index 000000000000..4decc5cf7467 --- /dev/null +++ b/cvat/apps/reid/urls.py @@ -0,0 +1,12 @@ +# Copyright (C) 2018 Intel Corporation +# +# SPDX-License-Identifier: MIT + +from django.urls import path +from . import views + +urlpatterns = [ + path('start/job/ +