Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Re-Identification application #299

Merged
merged 29 commits into from
Feb 8, 2019
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
29 commits
Select commit Hold shift + click to select a range
dbab909
ReID initial commit
bsekachev Jan 23, 2019
ed6ff96
ReID installation
bsekachev Jan 23, 2019
0855f43
Additional settings window
bsekachev Jan 23, 2019
43e3f77
Intel copiright has been added
bsekachev Jan 24, 2019
6aa5bb3
Added permissions
bsekachev Jan 24, 2019
ee0e902
ReID README.md
bsekachev Jan 24, 2019
fbb4b4f
Updated changelog
bsekachev Jan 24, 2019
d1158c2
Dockerfile has been updated
bsekachev Jan 24, 2019
060333f
Codacy fixes
bsekachev Jan 25, 2019
a8abda8
Grammar fix
bsekachev Jan 25, 2019
9805251
Application config
bsekachev Jan 25, 2019
0f10663
Merge branch 'develop' into bs/reid
bsekachev Jan 30, 2019
0f1aade
Some codacy fixes
bsekachev Jan 30, 2019
ddbb4ee
Fixed confirm
bsekachev Jan 31, 2019
c2f15a7
Codacy fixes
bsekachev Jan 31, 2019
d97d677
Codacy fixes
bsekachev Jan 31, 2019
684f355
Codacy fixes
bsekachev Jan 31, 2019
c465bfc
Fixed README.md
bsekachev Jan 31, 2019
0a63f58
ITGalaxy remark lint config
bsekachev Jan 31, 2019
01faa14
Fixed codacy issues
bsekachev Jan 31, 2019
d95549c
Removed config
bsekachev Feb 1, 2019
bea0649
RemarkLint config has been added
bsekachev Feb 1, 2019
9002789
RemarkLint config has been updated
bsekachev Feb 1, 2019
931cb97
Removed animations
bsekachev Feb 4, 2019
4344f0b
Removed extra permissions
bsekachev Feb 4, 2019
c8e6b22
Merge branch 'develop' into bs/reid
bsekachev Feb 5, 2019
c8bfc9a
Hints for inputs. Overlay during ReId processing
bsekachev Feb 7, 2019
8f28165
Fixed typos
bsekachev Feb 7, 2019
2f9b5a0
Fixed typos neightbor -> neighbor
bsekachev Feb 8, 2019
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
16 changes: 16 additions & 0 deletions .remarkrc.js
Original file line number Diff line number Diff line change
@@ -0,0 +1,16 @@
exports.settings = {bullet: '*', paddedTable: false}

exports.plugins = [
require('remark-preset-lint-recommended'),
require('remark-preset-lint-consistent'),
require('remark-validate-links'),
[require("remark-lint-no-dead-urls"), { skipOffline: true }],
[require("remark-lint-maximum-line-length"), 120],
[require("remark-lint-maximum-heading-length"), 120],
[require("remark-lint-list-item-indent"), "tab-size"],
[require("remark-lint-list-item-spacing"), false],
[require("remark-lint-strong-marker"), "*"],
[require("remark-lint-emphasis-marker"), "_"],
[require("remark-lint-unordered-list-marker-style"), "-"],
[require("remark-lint-ordered-list-marker-style"), "."],
]
1 change: 1 addition & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,7 @@ and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0
### Added
- OpenVINO auto annotation: it is possible to upload a custom model and annotate images automatically.
- Ability to rotate images/video in the client part (Ctrl+R, Shift+Ctrl+R shortcuts) (#305)
- The ReID application for automatic bounding box merging has been added (#299)

### Changed
- Propagation setup has been moved from settings to bottom player panel
Expand Down
15 changes: 11 additions & 4 deletions Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -103,14 +103,11 @@ RUN if [ "$WITH_TESTS" = "yes" ]; then \
COPY cvat/requirements/ /tmp/requirements/
COPY supervisord.conf mod_wsgi.conf wait-for-it.sh manage.py ${HOME}/
RUN pip3 install --no-cache-dir -r /tmp/requirements/${DJANGO_CONFIGURATION}.txt
COPY cvat/ ${HOME}/cvat

COPY ssh ${HOME}/.ssh

# Install git application dependencies
RUN apt-get update && \
apt-get install -y ssh netcat-openbsd git curl zip && \
curl -s https://packagecloud.io/install/repositories/github/git-lfs/script.deb.sh | bash && \
wget -qO /dev/stdout https://packagecloud.io/install/repositories/github/git-lfs/script.deb.sh | bash && \
apt-get install -y git-lfs && \
git lfs install && \
rm -rf /var/lib/apt/lists/* && \
Expand All @@ -120,6 +117,16 @@ RUN apt-get update && \
echo export "GIT_SSH_COMMAND=\"ssh -o StrictHostKeyChecking=no -o ConnectTimeout=30 -o ProxyCommand='nc -X 5 -x ${socks_proxy} %h %p'\"" >> ${HOME}/.bashrc; \
fi

# Download model for re-identification app
ENV REID_MODEL_DIR=${HOME}/reid
RUN if [ "$OPENVINO_TOOLKIT" = "yes" ]; then \
mkdir ${HOME}/reid && \
wget https://download.01.org/openvinotoolkit/2018_R5/open_model_zoo/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.xml -O reid/reid.xml && \
wget https://download.01.org/openvinotoolkit/2018_R5/open_model_zoo/person-reidentification-retail-0079/FP32/person-reidentification-retail-0079.bin -O reid/reid.bin; \
fi

COPY ssh ${HOME}/.ssh
COPY cvat/ ${HOME}/cvat
COPY tests ${HOME}/tests
RUN patch -p1 < ${HOME}/cvat/apps/engine/static/engine/js/3rdparty.patch
RUN chown -R ${USER}:${USER} .
Expand Down
9 changes: 7 additions & 2 deletions cvat/apps/engine/static/engine/js/annotationUI.js
Original file line number Diff line number Diff line change
Expand Up @@ -159,7 +159,12 @@ function buildAnnotationUI(job, shapeData, loadJobEvent) {
window.cvat.data = {
get: () => shapeCollectionModel.exportAll(),
set: (data) => {
shapeCollectionModel.empty();
for (let type in data) {
for (let shape of data[type]) {
shape.id = idGenerator.next();
}
}

shapeCollectionModel.import(data, false);
shapeCollectionModel.update();
},
Expand Down Expand Up @@ -248,7 +253,7 @@ function buildAnnotationUI(job, shapeData, loadJobEvent) {

$(window).on('click', function(event) {
Logger.updateUserActivityTimer();
if (event.target.classList.contains('modal')) {
if (event.target.classList.contains('modal') && !event.target.classList.contains('force-modal')) {
event.target.classList.add('hidden');
}
});
Expand Down
22 changes: 22 additions & 0 deletions cvat/apps/reid/README.md
Original file line number Diff line number Diff line change
@@ -0,0 +1,22 @@
# Re-Identification Application

## About the application

The ReID application uses a deep learning model to automatically merge bounding boxes between neighboring frames.
You can use the "Merge" and "Split" functionality to edit the automatically generated annotations.

## Installation

This application will be installed automatically with the [OpenVINO](https://github.com/opencv/cvat/blob/develop/components/openvino/README.md) component.

## Running

To start the ReID merge process:

- Open an annotation job
- Open the menu
- Click the "Run ReID Merge" button
- Click the "Submit" button. Here you can also experiment with the values of the model threshold and the maximum distance.
- Model threshold is the maximum cosine distance between object embeddings.
- Maximum distance defines the maximum radius by which an object can move between neighboring frames.
- The process will start. You can cancel it from the menu.
9 changes: 9 additions & 0 deletions cvat/apps/reid/__init__.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
# Copyright (C) 2018 Intel Corporation
#
# SPDX-License-Identifier: MIT

from cvat.settings.base import JS_3RDPARTY

# Dotted path to the AppConfig subclass declared in this application's apps.py.
default_app_config = 'cvat.apps.reid.apps.ReidConfig'

# Register the ReID client plugin under the 'engine' key of JS_3RDPARTY.
# A new list is assigned so that an existing 'engine' list is not mutated in place.
JS_3RDPARTY['engine'] = [*JS_3RDPARTY.get('engine', []), 'reid/js/enginePlugin.js']
8 changes: 8 additions & 0 deletions cvat/apps/reid/apps.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,8 @@
# Copyright (C) 2018 Intel Corporation
#
# SPDX-License-Identifier: MIT

from django.apps import AppConfig

class ReidConfig(AppConfig):
    """Django application configuration for the ReID application."""

    # Full Python path of the application package this config belongs to.
    name = 'cvat.apps.reid'
226 changes: 226 additions & 0 deletions cvat/apps/reid/reid.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,226 @@
# Copyright (C) 2018 Intel Corporation
#
# SPDX-License-Identifier: MIT

import os
import rq
import cv2
import math
import numpy
import fnmatch

from openvino.inference_engine import IENetwork, IEPlugin
from scipy.optimize import linear_sum_assignment
from scipy.spatial.distance import euclidean, cosine

from cvat.apps.engine.models import Job


class ReID:
    """Merge per-frame bounding boxes of one job into tracks.

    Boxes on consecutive frames are compared with a re-identification
    network: each box is cropped from its frame, turned into an embedding,
    and pairs are matched by minimising the total cosine distance between
    embeddings. Matched boxes share a path; ``run`` returns those paths.
    """

    # Class-level defaults so that ``__del__`` and helpers can read these
    # attributes even if ``__init__`` did not run to completion.
    __threshold = None
    __max_distance = None
    __frame_urls = None
    __frame_boxes = None
    __stop_frame = None
    __plugin = None
    __executable_network = None
    __input_blob_name = None
    __output_blob_name = None
    __input_height = None
    __input_width = None

    def __init__(self, jid, data):
        """Collect frames and boxes of job ``jid`` and load the ReID network.

        Args:
            jid: primary key of the ``Job`` to process.
            data: mapping with the keys ``"threshold"`` (largest accepted
                cosine distance for a match), ``"maxDistance"`` (largest
                accepted distance between box centres) and ``"boxes"``
                (iterable of box dicts; each is read for ``"frame"``,
                ``"label_id"``, ``"xtl"``, ``"ytl"``, ``"xbr"``, ``"ybr"``).

        Raises:
            Exception: if the ``IE_PLUGINS_PATH`` or ``REID_MODEL_DIR``
                environment variable is not defined.
        """
        self.__threshold = data["threshold"]
        self.__max_distance = data["maxDistance"]
        self.__frame_urls = {}
        self.__frame_boxes = {}

        db_job = Job.objects.select_related('segment__task').get(pk=jid)
        db_segment = db_job.segment
        db_task = db_segment.task

        self.__stop_frame = db_segment.stop_frame

        for root, _, filenames in os.walk(db_task.get_data_dirname()):
            for filename in fnmatch.filter(filenames, '*.jpg'):
                try:
                    frame = int(os.path.splitext(filename)[0])
                except ValueError:
                    # Not a "<frame number>.jpg" file; it cannot be a frame.
                    continue
                if db_segment.start_frame <= frame <= db_segment.stop_frame:
                    self.__frame_urls[frame] = os.path.join(root, filename)

        # Group the boxes by frame in a single pass. Every known frame gets
        # a (possibly empty) list; boxes on unknown frames are ignored.
        self.__frame_boxes = {frame: [] for frame in self.__frame_urls}
        for box in data["boxes"]:
            boxes_on_frame = self.__frame_boxes.get(box["frame"])
            if boxes_on_frame is not None:
                boxes_on_frame.append(box)

        IE_PLUGINS_PATH = os.getenv('IE_PLUGINS_PATH', None)
        REID_MODEL_DIR = os.getenv('REID_MODEL_DIR', None)

        if not IE_PLUGINS_PATH:
            raise Exception("Environment variable 'IE_PLUGINS_PATH' isn't defined")
        if not REID_MODEL_DIR:
            raise Exception("Environment variable 'REID_MODEL_DIR' isn't defined")

        REID_XML = os.path.join(REID_MODEL_DIR, "reid.xml")
        REID_BIN = os.path.join(REID_MODEL_DIR, "reid.bin")

        self.__plugin = IEPlugin(device="CPU", plugin_dirs=[IE_PLUGINS_PATH])
        network = IENetwork.from_ir(model=REID_XML, weights=REID_BIN)
        self.__input_blob_name = next(iter(network.inputs))
        self.__output_blob_name = next(iter(network.outputs))
        # The last two dimensions of the input shape are taken as (height, width).
        self.__input_height, self.__input_width = network.inputs[self.__input_blob_name].shape[-2:]
        self.__executable_network = self.__plugin.load(network=network)
        del network

    def __del__(self):
        """Drop the references to the loaded network and then to the plugin."""
        self.__executable_network = None
        self.__plugin = None

    def __boxes_are_compatible(self, cur_box, next_box):
        """Tell whether ``next_box`` may continue the path of ``cur_box``.

        The boxes must have the same label, their centres must be at most
        ``maxDistance`` apart, and ``next_box`` must not belong to a path yet.
        """
        cur_c_x = (cur_box["xtl"] + cur_box["xbr"]) / 2
        cur_c_y = (cur_box["ytl"] + cur_box["ybr"]) / 2
        next_c_x = (next_box["xtl"] + next_box["xbr"]) / 2
        next_c_y = (next_box["ytl"] + next_box["ybr"]) / 2
        compatible_distance = euclidean([cur_c_x, cur_c_y], [next_c_x, next_c_y]) <= self.__max_distance
        compatible_label = cur_box["label_id"] == next_box["label_id"]
        return compatible_distance and compatible_label and "path_id" not in next_box

    def __compute_embedding(self, image):
        """Run the network on one crop and return its embedding as a 1-D array."""
        # Resize to the network input size and move channels first (HWC -> CHW).
        blob = cv2.resize(image, (self.__input_width, self.__input_height)).transpose((2, 0, 1))
        outputs = self.__executable_network.infer(inputs={
            self.__input_blob_name: blob[numpy.newaxis, ...]
        })
        # flatten() copies, so the embedding stays valid across later inferences.
        return outputs[self.__output_blob_name].flatten()

    def __compute_difference(self, image_1, image_2):
        """Return the cosine distance between the embeddings of two crops."""
        return cosine(self.__compute_embedding(image_1), self.__compute_embedding(image_2))

    def __compute_difference_matrix(self, cur_boxes, next_boxes, cur_image, next_image):
        """Build the cost matrix between boxes of two consecutive frames.

        Returns:
            A ``len(cur_boxes) x len(next_boxes)`` float array. Compatible
            pairs hold the cosine distance of their embeddings; every other
            cell (incompatible pair, or a box whose crop is empty) keeps
            the large default value of 1000.0.
        """
        def _int(number, upper):
            return math.floor(numpy.clip(number, 0, upper - 1))

        def _embedding(cache, index, image, box):
            # Each crop is inferred at most once per call; None marks a
            # degenerate (zero-area) crop that cannot be resized.
            if index not in cache:
                height, width = image.shape[:2]
                xtl, xbr = _int(box["xtl"], width), _int(box["xbr"], width)
                ytl, ybr = _int(box["ytl"], height), _int(box["ybr"], height)
                crop = image[ytl:ybr, xtl:xbr]
                cache[index] = self.__compute_embedding(crop) if crop.size else None
            return cache[index]

        default_mat_value = 1000.0
        matrix = numpy.full([len(cur_boxes), len(next_boxes)], default_mat_value, dtype=float)

        cur_embeddings = {}
        next_embeddings = {}
        for row, cur_box in enumerate(cur_boxes):
            for col, next_box in enumerate(next_boxes):
                if not self.__boxes_are_compatible(cur_box, next_box):
                    continue

                cur_embedding = _embedding(cur_embeddings, row, cur_image, cur_box)
                if cur_embedding is None:
                    continue
                next_embedding = _embedding(next_embeddings, col, next_image, next_box)
                if next_embedding is None:
                    continue

                matrix[row][col] = cosine(cur_embedding, next_embedding)

        return matrix

    def __apply_matching(self):
        """Link boxes of consecutive frames into paths.

        Progress is written to the current RQ job's ``meta["progress"]``.

        Returns:
            A dict mapping path id to the list of boxes of that path, or
            ``None`` if ``"cancel"`` appeared in the job's meta.
        """
        frames = sorted(self.__frame_boxes)
        box_paths = {}
        if not frames:
            # No frame images were found, so there is nothing to match.
            return box_paths

        def _open_paths(boxes):
            # Every box that was not attached to a path starts its own.
            for box in boxes:
                if "path_id" not in box:
                    path_id = len(box_paths)
                    box_paths[path_id] = [box]
                    box["path_id"] = path_id

        job = rq.get_current_job()
        for step, (cur_frame, next_frame) in enumerate(zip(frames, frames[1:])):
            job.refresh()
            if "cancel" in job.meta:
                return None

            job.meta["progress"] = step * 100.0 / len(frames)
            job.save_meta()

            cur_boxes = self.__frame_boxes[cur_frame]
            next_boxes = self.__frame_boxes[next_frame]
            _open_paths(cur_boxes)

            if not (cur_boxes and next_boxes):
                continue

            cur_image = cv2.imread(self.__frame_urls[cur_frame], cv2.IMREAD_COLOR)
            next_image = cv2.imread(self.__frame_urls[next_frame], cv2.IMREAD_COLOR)
            difference_matrix = self.__compute_difference_matrix(cur_boxes, next_boxes, cur_image, next_image)
            cur_idxs, next_idxs = linear_sum_assignment(difference_matrix)
            for cur_idx, next_idx in zip(cur_idxs, next_idxs):
                # The assignment is total; accept only close enough pairs.
                if difference_matrix[cur_idx][next_idx] <= self.__threshold:
                    cur_box = cur_boxes[cur_idx]
                    next_box = next_boxes[next_idx]
                    next_box["path_id"] = cur_box["path_id"]
                    box_paths[cur_box["path_id"]].append(next_box)

        _open_paths(self.__frame_boxes[frames[-1]])
        return box_paths

    def __build_tracks(self, box_paths):
        """Convert matched paths into the list of path dicts returned by ``run``.

        The boxes are modified in place: per-box identifiers are removed and
        ``"outside"``/``"attributes"`` are set. A path that does not end on
        the stop frame gets a final copy of its last shape, one frame later
        and marked ``"outside"``.
        """
        output = []
        for boxes in box_paths.values():
            first_box = boxes[0]
            track = {
                "label_id": first_box["label_id"],
                "group_id": 0,
                "attributes": [],
                "frame": first_box["frame"],
                "shapes": boxes
            }

            for box in boxes:
                # pop() tolerates boxes that lack one of these keys.
                for key in ("id", "path_id", "group_id", "label_id"):
                    box.pop(key, None)
                box["outside"] = False
                box["attributes"] = []

            last_box = boxes[-1]
            if last_box["frame"] != self.__stop_frame:
                closing = last_box.copy()
                closing["outside"] = True
                closing["frame"] += 1
                # Fresh list so the two shapes do not share one object.
                closing["attributes"] = []
                boxes.append(closing)

            output.append(track)

        return output

    def run(self):
        """Run the matching and return the resulting paths.

        Returns:
            A list of path dicts with the keys ``"label_id"``,
            ``"group_id"``, ``"attributes"``, ``"frame"`` and ``"shapes"``,
            or ``None`` if the ReID process has been canceled.
        """
        box_paths = self.__apply_matching()

        # ReID process has been canceled
        if box_paths is None:
            return None

        return self.__build_tracks(box_paths)
Loading